{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,15]],"date-time":"2026-01-15T06:50:17Z","timestamp":1768459817743,"version":"3.49.0"},"update-to":[{"DOI":"10.1371\/journal.pcbi.1008017","type":"new_version","label":"New version","source":"publisher","updated":{"date-parts":[[2020,7,31]],"date-time":"2020-07-31T00:00:00Z","timestamp":1596153600000}}],"reference-count":67,"publisher":"Public Library of Science (PLoS)","issue":"7","license":[{"start":{"date-parts":[[2020,7,21]],"date-time":"2020-07-21T00:00:00Z","timestamp":1595289600000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100001711","name":"Schweizerischer Nationalfonds zur F\u00f6rderung der Wissenschaftlichen Forschung","doi-asserted-by":"publisher","award":["176153"],"award-info":[{"award-number":["176153"]}],"id":[{"id":"10.13039\/501100001711","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["www.ploscompbiol.org"],"crossmark-restriction":false},"short-container-title":["PLoS Comput Biol"],"DOI":"10.1371\/journal.pcbi.1008017","type":"journal-article","created":{"date-parts":[[2020,7,21]],"date-time":"2020-07-21T18:28:28Z","timestamp":1595356108000},"page":"e1008017","update-policy":"https:\/\/doi.org\/10.1371\/journal.pcbi.corrections_policy","source":"Crossref","is-referenced-by-count":41,"title":["Capsule networks as recurrent models of grouping and segmentation"],"prefix":"10.1371","volume":"16","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5120-9750","authenticated-orcid":true,"given":"Adrien","family":"Doerig","sequence":"first","affiliation":[]},{"given":"Lynn","family":"Schmittwilken","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7589-5385","authenticated-orcid":true,"given":"Bilge","family":"Sayim","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4210-7570","authenticated-orcid":true,"given":"Mauro","family":"Manassi","sequence":"additional","affiliation":[]},{"given":"Michael H.","family":"Herzog","sequence":"additional","affiliation":[]}],"member":"340","published-online":{"date-parts":[[2020,7,21]]},"reference":[{"key":"pcbi.1008017.ref001","doi-asserted-by":"crossref","first-page":"415","DOI":"10.1016\/j.neuron.2012.01.010","article-title":"How Does the Brain Solve Visual Object Recognition?","volume":"73","author":"JJ DiCarlo","year":"2012","journal-title":"Neuron"},{"key":"pcbi.1008017.ref002","doi-asserted-by":"crossref","first-page":"106","DOI":"10.1113\/jphysiol.1962.sp006837","article-title":"Receptive fields, binocular interaction and functional architecture in the cat\u2019s visual cortex","volume":"160","author":"DH Hubel","year":"1962","journal-title":"The Journal of physiology"},{"key":"pcbi.1008017.ref003","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","author":"A Krizhevsky","year":"2012","journal-title":"Advances in neural information processing systems"},{"key":"pcbi.1008017.ref004","doi-asserted-by":"crossref","first-page":"1204","DOI":"10.1126\/science.aar6170","article-title":"Neural scene representation and rendering","volume":"360","author":"SA Eslami","year":"2018","journal-title":"Science"},{"key":"pcbi.1008017.ref005","first-page":"262","volume-title":"Texture Synthesis Using Convolutional Neural Networks.","author":"L Gatys","year":"2015"},{"key":"pcbi.1008017.ref006","article-title":"A style-based generator architecture for generative adversarial networks.","author":"T Karras","year":"2018","journal-title":"arXiv preprint arXiv:181204948"},{"key":"pcbi.1008017.ref007","doi-asserted-by":"crossref","first-page":"571","DOI":"10.1016\/S0166-2236(00)01657-X","article-title":"The distinct modes of vision offered by feedforward and recurrent processing","volume":"23","author":"VA Lamme","year":"2000","journal-title":"Trends in neurosciences"},{"key":"pcbi.1008017.ref008","first-page":"201905544","article-title":"Recurrence is required to capture the representational dynamics of the human visual system","author":"TC Kietzmann","year":"2019","journal-title":"Proceedings of the National Academy of Sciences"},{"key":"pcbi.1008017.ref009","doi-asserted-by":"crossref","first-page":"e1006580","DOI":"10.1371\/journal.pcbi.1006580","article-title":"Beyond Bouma\u2019s window: How to explain global aspects of crowding?","volume":"15","author":"A Doerig","year":"2019","journal-title":"PLOS Computational Biology"},{"key":"pcbi.1008017.ref010","first-page":"213","volume-title":"Comparing the ability of humans and DNNs to recognise closed contours in cluttered images","author":"CM Funke","year":"2018"},{"key":"pcbi.1008017.ref011","article-title":"One pixel attack for fooling deep neural networks","author":"J Su","year":"2019","journal-title":"IEEE Transactions on Evolutionary Computation"},{"key":"pcbi.1008017.ref012","article-title":"Intriguing properties of neural networks.","author":"C Szegedy","year":"2013","journal-title":"arXiv preprint arXiv:13126199."},{"key":"pcbi.1008017.ref013","article-title":"ImageNet-trained CNNs are biased towards texture; increasing shape bias improves accuracy and robustness.","author":"R Geirhos","year":"2018","journal-title":"arXiv preprint arXiv:181112231."},{"key":"pcbi.1008017.ref014","doi-asserted-by":"crossref","first-page":"e1006613","DOI":"10.1371\/journal.pcbi.1006613","article-title":"Deep convolutional networks do not classify based on global object shape","volume":"14","author":"N Baker","year":"2018","journal-title":"PLoS computational biology"},{"key":"pcbi.1008017.ref015","article-title":"Approximating CNNs with Bag-of-local-Features models works surprisingly well on ImageNet.","author":"W Brendel","year":"2019","journal-title":"arXiv preprint arXiv:190400760."},{"key":"pcbi.1008017.ref016","doi-asserted-by":"crossref","first-page":"4760","DOI":"10.1523\/JNEUROSCI.3073-18.2019","article-title":"Neural coding for shape and texture in macaque area V4","volume":"39","author":"T Kim","year":"2019","journal-title":"Journal of Neuroscience"},{"key":"pcbi.1008017.ref017","first-page":"744268","article-title":"Crowding Reveals Fundamental Differences in Local vs. Global Processing in Humans and Machines.","author":"A Doerig","year":"2019","journal-title":"bioRxiv."},{"key":"pcbi.1008017.ref018","author":"K Hermann","year":"2019","journal-title":"Exploring CNN Inductive Biases: Shape vs. Texture. NeurIPS Workshop on Shared Visual Representations in Human & Machine Intelligence."},{"key":"pcbi.1008017.ref019","doi-asserted-by":"crossref","first-page":"248","DOI":"10.1109\/CVPR.2009.5206848","article-title":"Imagenet: A large-scale hierarchical image database.","author":"J Deng","year":"2009","journal-title":"2009 IEEE conference on computer vision and pattern recognition."},{"key":"pcbi.1008017.ref020","doi-asserted-by":"crossref","first-page":"e1003915","DOI":"10.1371\/journal.pcbi.1003915","article-title":"Deep supervised, but not unsupervised, models may explain IT cortical representation","volume":"10","author":"S-M Khaligh-Razavi","year":"2014","journal-title":"PLoS computational biology"},{"key":"pcbi.1008017.ref021","doi-asserted-by":"crossref","first-page":"8619","DOI":"10.1073\/pnas.1403112111","article-title":"Performance-optimized hierarchical models predict neural responses in higher visual cortex","volume":"111","author":"DL Yamins","year":"2014","journal-title":"Proceedings of the National Academy of Sciences"},{"key":"pcbi.1008017.ref022","article-title":"Psyphy: A psychophysics driven evaluation framework for visual recognition","author":"B RichardWebster","year":"2018","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"key":"pcbi.1008017.ref023","doi-asserted-by":"crossref","first-page":"635","DOI":"10.1016\/j.visres.2007.12.009","article-title":"Crowding\u2014An essential bottleneck for object recognition: A mini-review","volume":"48","author":"DM Levi","year":"2008","journal-title":"Vision Research"},{"key":"pcbi.1008017.ref024","doi-asserted-by":"crossref","first-page":"160","DOI":"10.1016\/j.tics.2011.02.005","article-title":"Visual crowding: a fundamental limit on conscious perception and object recognition.","volume":"15","author":"D Whitney","year":"2011","journal-title":"Trends in Cognitive Sciences"},{"key":"pcbi.1008017.ref025","doi-asserted-by":"crossref","first-page":"767","DOI":"10.1016\/0042-6989(73)90041-2","article-title":"Visual interference in the parafoveal recognition of initial and final letters of words","volume":"13","author":"H Bouma","year":"1973","journal-title":"Vision Research"},{"key":"pcbi.1008017.ref026","doi-asserted-by":"crossref","first-page":"445","DOI":"10.1016\/j.conb.2008.09.008","article-title":"Crowding: a cortical constraint on object recognition","volume":"18","author":"DG Pelli","year":"2008","journal-title":"Current Opinion in Neurobiology"},{"key":"pcbi.1008017.ref027","doi-asserted-by":"crossref","first-page":"R127","DOI":"10.1016\/j.cub.2017.12.051","article-title":"Multi-level Crowding and the Paradox of Object Recognition in Clutter","volume":"28","author":"M Manassi","year":"2018","journal-title":"Current Biology"},{"key":"pcbi.1008017.ref028","doi-asserted-by":"crossref","first-page":"35","DOI":"10.1167\/16.3.35","article-title":"What crowding can tell us about object representations","volume":"16","author":"M Manassi","year":"2016","journal-title":"Journal of Vision"},{"key":"pcbi.1008017.ref029","doi-asserted-by":"crossref","first-page":"1137","DOI":"10.1016\/0042-6989(75)90012-7","article-title":"Temporal and spatial interference with vernier acuity","volume":"15","author":"G Westheimer","year":"1975","journal-title":"Vision research"},{"key":"pcbi.1008017.ref030","doi-asserted-by":"crossref","first-page":"963","DOI":"10.1016\/0042-6989(85)90207-X","article-title":"Vernier acuity, crowding and cortical magnification","volume":"25","author":"DM Levi","year":"1985","journal-title":"Vision research"},{"key":"pcbi.1008017.ref031","doi-asserted-by":"crossref","first-page":"e48054","DOI":"10.1371\/journal.pone.0048054","article-title":"Sequential grouping modulates the effect of non-simultaneous masking on auditory intensity resolution.","volume":"7","author":"D Oberfeld","year":"2012","journal-title":"PloS one"},{"key":"pcbi.1008017.ref032","doi-asserted-by":"crossref","first-page":"52","DOI":"10.1016\/j.visres.2015.04.016","article-title":"Perceptual grouping determines haptic contextual modulation","volume":"126","author":"KE Overvliet","year":"2016","journal-title":"Vision Research"},{"key":"pcbi.1008017.ref033","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1167\/9.2.5","article-title":"Global stimulus configuration modulates crowding","volume":"9","author":"TP Saarela","year":"2009","journal-title":"Journal of Vision"},{"key":"pcbi.1008017.ref034","doi-asserted-by":"crossref","first-page":"433","DOI":"10.1038\/415433a","article-title":"Effects of grouping in contextual modulation","volume":"415","author":"MH Herzog","year":"2002","journal-title":"Nature"},{"key":"pcbi.1008017.ref035","doi-asserted-by":"crossref","first-page":"641","DOI":"10.1177\/0956797610368811","article-title":"Gestalt factors modulate basic spatial vision","volume":"21","author":"B Sayim","year":"2010","journal-title":"Psychological Science"},{"key":"pcbi.1008017.ref036","doi-asserted-by":"crossref","first-page":"17","DOI":"10.1167\/10.10.17","article-title":"The effect of spacing regularity on visual crowding","volume":"10","author":"TP Saarela","year":"2010","journal-title":"Journal of Vision"},{"key":"pcbi.1008017.ref037","doi-asserted-by":"crossref","first-page":"13","DOI":"10.1167\/12.10.13","article-title":"Grouping, pooling, and when bigger is better in visual crowding","volume":"12","author":"M Manassi","year":"2012","journal-title":"Journal of Vision"},{"key":"pcbi.1008017.ref038","doi-asserted-by":"crossref","first-page":"R352","DOI":"10.1016\/j.cub.2016.03.003","article-title":"How best to unify crowding?","volume":"26","author":"MV Pachai","year":"2016","journal-title":"Current Biology"},{"key":"pcbi.1008017.ref039","first-page":"3856","article-title":"Dynamic routing between capsules","author":"S Sabour","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"pcbi.1008017.ref040","doi-asserted-by":"crossref","first-page":"10","DOI":"10.1167\/13.13.10","article-title":"When crowding of crowding leads to uncrowding","volume":"13","author":"M Manassi","year":"2013","journal-title":"Journal of Vision"},{"key":"pcbi.1008017.ref041","doi-asserted-by":"crossref","first-page":"50","DOI":"10.1016\/j.visres.2013.03.010","article-title":"Crowding during restricted and free viewing","volume":"84","author":"JM Wallace","year":"2013","journal-title":"Vision Research"},{"key":"pcbi.1008017.ref042","doi-asserted-by":"crossref","first-page":"11","DOI":"10.1167\/14.6.11","article-title":"Large crowding zones in peripheral vision for briefly presented stimuli","volume":"14","author":"SP Tripathy","year":"2014","journal-title":"Journal of Vision"},{"key":"pcbi.1008017.ref043","doi-asserted-by":"crossref","first-page":"189","DOI":"10.1007\/BF00309083","article-title":"Perceptual integration of identity, location and colour.","volume":"48","author":"EA Styles","year":"1986","journal-title":"Psychological Research"},{"key":"pcbi.1008017.ref044","doi-asserted-by":"crossref","first-page":"187","DOI":"10.1088\/0954-898X_10_2_305","article-title":"Visual segmentation by contextual influences via intra-cortical interactions in the primary visual cortex","volume":"10","author":"Z Li","year":"1999","journal-title":"Network: computation in neural systems"},{"key":"pcbi.1008017.ref045","doi-asserted-by":"crossref","first-page":"739","DOI":"10.1038\/89532","article-title":"Compulsory averaging of crowded orientation signals in human vision","volume":"4","author":"L Parkes","year":"2001","journal-title":"Nature neuroscience"},{"key":"pcbi.1008017.ref046","doi-asserted-by":"crossref","first-page":"12","DOI":"10.1167\/4.12.12","article-title":"Crowding is unlike ordinary masking: Distinguishing feature integration from detection","volume":"4","author":"DG Pelli","year":"2004","journal-title":"Journal of Vision"},{"key":"pcbi.1008017.ref047","first-page":"19","article-title":"Challenges to pooling models of crowding: Implications for visual mechanisms","author":"R Rosenholtz","year":"2019","journal-title":"Journal of vision"},{"key":"pcbi.1008017.ref048","doi-asserted-by":"crossref","first-page":"520","DOI":"10.1038\/381520a0","article-title":"Speed of processing in the human visual system","volume":"381","author":"S Thorpe","year":"1996","journal-title":"nature"},{"key":"pcbi.1008017.ref049","article-title":"Deep neural networks in computational neuroscience","volume":"133504","author":"TC Kietzmann","year":"2018","journal-title":"bioRxiv"},{"key":"pcbi.1008017.ref050","article-title":"Disentangling neural mechanisms for perceptual grouping.","author":"J Kim","year":"2019","journal-title":"arXiv preprint arXiv:190601558."},{"key":"pcbi.1008017.ref051","doi-asserted-by":"crossref","first-page":"8835","DOI":"10.1073\/pnas.1719397115","article-title":"Recurrent computations for visual pattern completion","volume":"115","author":"H Tang","year":"2018","journal-title":"Proceedings of the National Academy of Sciences"},{"key":"pcbi.1008017.ref052","article-title":"Recurrent networks can recycle neural resources to flexibly trade speed for accuracy in visual recognition.","volume":"677237","author":"CJ Spoerer","year":"2019","journal-title":"bioRxiv."},{"key":"pcbi.1008017.ref053","article-title":"Sample-efficient image segmentation through recurrence.","author":"D Linsley","year":"2018","journal-title":"arXiv:181111356"},{"key":"pcbi.1008017.ref054","doi-asserted-by":"crossref","first-page":"359","DOI":"10.1016\/0893-6080(89)90020-8","article-title":"Multilayer feedforward networks are universal approximators.","volume":"2","author":"K Hornik","year":"1989","journal-title":"Neural networks."},{"key":"pcbi.1008017.ref055","article-title":"Depth in convolutional neural networks solves scene segmentation.","author":"N Seijdel","year":"2019","journal-title":"bioRxiv"},{"key":"pcbi.1008017.ref056","doi-asserted-by":"crossref","first-page":"399","DOI":"10.1146\/annurev-vision-091718-014951","article-title":"Deep learning: the good, the bad, and the ugly","volume":"5","author":"T Serre","year":"2019","journal-title":"Annual Review of Vision Science"},{"key":"pcbi.1008017.ref057","article-title":"Detecting and diagnosing adversarial images with class-conditional capsule reconstructions.","author":"Y Qin","year":"2019","journal-title":"arXiv preprint arXiv:190702957."},{"key":"pcbi.1008017.ref058","article-title":"Deflecting Adversarial Attacks.","author":"Y Qin","year":"2020","journal-title":"arXiv preprint arXiv:200207405."},{"key":"pcbi.1008017.ref059","author":"GE Hinton","year":"2018","journal-title":"Matrix capsules with EM routing"},{"key":"pcbi.1008017.ref060","doi-asserted-by":"crossref","unstructured":"Afshar P, Mohammadi A, Plataniotis KN. Brain tumor type classification via capsule networks. 2018 25th IEEE International Conference on Image Processing (ICIP). IEEE; 2018. pp. 3129\u20133133.","DOI":"10.1109\/ICIP.2018.8451379"},{"key":"pcbi.1008017.ref061","doi-asserted-by":"crossref","first-page":"1551","DOI":"10.3389\/fpsyg.2017.01551","article-title":"Recurrent convolutional neural networks: a better model of biological object recognition.","volume":"8","author":"CJ Spoerer","year":"2017","journal-title":"Frontiers in psychology."},{"key":"pcbi.1008017.ref062","doi-asserted-by":"crossref","first-page":"974","DOI":"10.1038\/s41593-019-0392-5","article-title":"Evidence that recurrent circuits are critical to the ventral stream\u2019s execution of core object recognition behavior","volume":"22","author":"K Kar","year":"2019","journal-title":"Nature neuroscience"},{"key":"pcbi.1008017.ref063","doi-asserted-by":"crossref","first-page":"483","DOI":"10.1037\/rev0000070","article-title":"Neural dynamics of grouping and segmentation explain properties of visual crowding.","volume":"124","author":"G Francis","year":"2017","journal-title":"Psychological review."},{"key":"pcbi.1008017.ref064","first-page":"234","article-title":"U-net: Convolutional networks for biomedical image segmentation","author":"O Ronneberger","year":"2015","journal-title":"International Conference on Medical image computing and computer-assisted intervention"},{"key":"pcbi.1008017.ref065","author":"R Girshick","year":"2018","journal-title":"Detectron"},{"key":"pcbi.1008017.ref066","article-title":"Sgdr: Stochastic gradient descent with warm restarts.","author":"I Loshchilov","year":"2016","journal-title":"arXiv preprint arXiv:160803983."},{"key":"pcbi.1008017.ref067","doi-asserted-by":"crossref","first-page":"782","DOI":"10.1121\/1.1910407","article-title":"PEST: Efficient estimates on probability functions","volume":"41","author":"M Taylor","year":"1967","journal-title":"The Journal of the Acoustical Society of America"}],"updated-by":[{"DOI":"10.1371\/journal.pcbi.1008017","type":"new_version","label":"New version","source":"publisher","updated":{"date-parts":[[2020,7,31]],"date-time":"2020-07-31T00:00:00Z","timestamp":1596153600000}}],"container-title":["PLOS Computational Biology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1008017","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,7,31]],"date-time":"2020-07-31T17:45:31Z","timestamp":1596217531000},"score":1,"resource":{"primary":{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1008017"}},"subtitle":[],"editor":[{"given":"Wolfgang","family":"Einh\u00e4user","sequence":"first","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2020,7,21]]},"references-count":67,"journal-issue":{"issue":"7","published-online":{"date-parts":[[2020,7,21]]}},"URL":"https:\/\/doi.org\/10.1371\/journal.pcbi.1008017","relation":{"new_version":[{"id-type":"doi","id":"10.1371\/journal.pcbi.1008017","asserted-by":"object"}]},"ISSN":["1553-7358"],"issn-type":[{"value":"1553-7358","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,7,21]]}}}