Sample stimuli

Ten example stimuli from the Baker2022frankenstein stimulus set (sample 0 through sample 9).

How to use

from brainscore_vision import load_benchmark
benchmark = load_benchmark("Baker2022frankenstein-accuracy_delta")
score = benchmark(my_model)  # my_model: any model implementing the Brain-Score BrainModel interface
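
A model that is already registered with Brain-Score can also be loaded by its identifier and scored directly. A minimal sketch, assuming the brainscore_vision package and the corresponding model plugin are installed; the identifier "alexnet" is illustrative, substitute any registered model:

from brainscore_vision import load_benchmark, load_model

model = load_model("alexnet")  # illustrative identifier; any registered model works
benchmark = load_benchmark("Baker2022frankenstein-accuracy_delta")
score = benchmark(model)
print(score)  # Score object holding the benchmark value and attached metadata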

Model scores

Rank     Score
1        .983
2        .974
3        .972
4        .939
5        .929
6        .929
7        .929
8        .899
9        .897
10       .889
11       .887
12       .874
13       .873
14       .867
15       .867
16       .865
17       .862
18       .858
19       .855
20       .854
21       .850
22       .844
23       .824
24       .806
25       .803
26       .801
27       .798
28       .793
29       .775
30       .770
31       .767
32       .767
33       .766
34       .766
35       .761
36       .754
37       .741
38       .731
39       .731
40       .727
41       .724
42       .717
43       .715
44       .714
45       .713
46       .712
47       .698
48       .696
49       .692
50       .681
51       .680
52       .671
53       .666
54       .662
55       .658
56       .645
57       .644
58       .641
59       .623
60       .617
61       .608
62       .607
63       .599
64       .578
65       .572
66       .568
67       .568
68       .567
69       .558
70       .545
71       .539
72       .536
73       .527
74       .523
75       .503
76       .503
77       .494
78       .487
79       .485
80       .485
81       .465
82       .464
83       .463
84       .463
85       .462
86       .457
87       .448
88       .448
89       .448
90       .435
91       .427
92       .420
93       .418
94       .410
95       .398
96       .395
97       .378
98       .374
99       .372
100      .365
101      .365
102      .362
103      .362
104      .343
105      .339
106      .335
107      .335
108      .335
109      .334
110      .314
111      .313
112      .310
113      .308
114      .301
115      .286
116      .284
117      .282
118      .278
119      .276
120      .270
121      .257
122      .232
123      .232
124      .220
125      .212
126      .204
127      .201
128      .160
129      .156
130      .155
131      .142
132      .131
133      .119
134      .111
135      .089
136      .042
137      .038
138      .007
139      .006
140      .003
141      .002
142-167  .000
168-222  X (no score)

Benchmark bibtex

@article{BAKER2022104913,
    title = {Deep learning models fail to capture the configural nature of human shape perception},
    journal = {iScience},
    volume = {25},
    number = {9},
    pages = {104913},
    year = {2022},
    issn = {2589-0042},
    doi = {https://doi.org/10.1016/j.isci.2022.104913},
    url = {https://www.sciencedirect.com/science/article/pii/S2589004222011853},
    author = {Nicholas Baker and James H. Elder},
    keywords = {Biological sciences, Neuroscience, Sensory neuroscience},
    abstract = {A hallmark of human object perception is sensitivity to the holistic configuration of the local shape features of an object. Deep convolutional neural networks (DCNNs) are currently the dominant models for object recognition processing in the visual cortex, but do they capture this configural sensitivity? To answer this question, we employed a dataset of animal silhouettes and created a variant of this dataset that disrupts the configuration of each object while preserving local features. While human performance was impacted by this manipulation, DCNN performance was not, indicating insensitivity to object configuration. Modifications to training and architecture to make networks more brain-like did not lead to configural processing, and none of the networks were able to accurately predict trial-by-trial human object judgements. We speculate that to match human configural sensitivity, networks must be trained to solve a broader range of object tasks beyond category recognition.}
}

Ceiling

Not available

Data: Baker2022frankenstein

Metric: accuracy_delta
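
For intuition about the metric name, below is a minimal sketch of an accuracy-delta style comparison. The benchmark name and the source paper suggest comparing the drop in accuracy between whole and configuration-disrupted ("frankenstein") silhouettes; the per-condition accuracies and the final normalization in this sketch are purely illustrative assumptions, not the Brain-Score implementation:

# Illustrative sketch only -- not the Brain-Score implementation.
# Hypothetical per-condition accuracies (fraction correct); all values made up.
model_acc_whole, model_acc_frankenstein = 0.90, 0.85
human_acc_whole, human_acc_frankenstein = 0.92, 0.65

def accuracy_delta(acc_whole: float, acc_frankenstein: float) -> float:
    """Drop in accuracy when the object's configuration is disrupted."""
    return acc_whole - acc_frankenstein

model_delta = accuracy_delta(model_acc_whole, model_acc_frankenstein)  # ~0.05
human_delta = accuracy_delta(human_acc_whole, human_acc_frankenstein)  # ~0.27

# One possible 0-1 alignment score: closeness of the model's accuracy drop to the
# human drop (this normalization is an assumption made for illustration).
score = max(0.0, 1.0 - abs(model_delta - human_delta))
print(round(score, 2))  # ~0.78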