{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,21]],"date-time":"2026-01-21T15:42:34Z","timestamp":1769010154336,"version":"3.49.0"},"reference-count":32,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,10,27]],"date-time":"2024-10-27T00:00:00Z","timestamp":1729987200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,10,27]],"date-time":"2024-10-27T00:00:00Z","timestamp":1729987200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,10,27]]},"DOI":"10.1109\/icip51287.2024.10647295","type":"proceedings-article","created":{"date-parts":[[2024,9,27]],"date-time":"2024-09-27T18:34:45Z","timestamp":1727462085000},"page":"493-499","source":"Crossref","is-referenced-by-count":1,"title":["Vito: Vision Transformer Optimization Via Knowledge Distillation On Decoders"],"prefix":"10.1109","author":[{"given":"Giovanni","family":"Bellitto","sequence":"first","affiliation":[{"name":"University of Catania,PeRCeiVe Lab,Italy"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Renato","family":"Sortino","sequence":"additional","affiliation":[{"name":"University of Catania,PeRCeiVe Lab,Italy"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Paolo","family":"Spadaro","sequence":"additional","affiliation":[{"name":"University of Catania,PeRCeiVe Lab,Italy"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Simone","family":"Palazzo","sequence":"additional","affiliation":[{"name":"University of Catania,PeRCeiVe Lab,Italy"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Federica Proietto","family":"Salanitri","sequence":"additional","affiliation":[{"name":"University of Catania,PeRCeiVe Lab,Italy"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Giuseppe","family":"Fiameni","sequence":"additional","affiliation":[{"name":"NVIDIA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Efstratios","family":"Gavves","sequence":"additional","affiliation":[{"name":"University of Amsterdam,Informatics Institute,The Netherlands"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Concetto","family":"Spampinato","sequence":"additional","affiliation":[{"name":"University of Catania,PeRCeiVe Lab,Italy"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Scaling laws for neural language models","author":"Kaplan","year":"2020","journal-title":"arXiv preprint arXiv:2001.08361"},{"key":"ref2","article-title":"Attention is all you need","author":"Vaswani","year":"2017","journal-title":"Neurips"},{"key":"ref3","article-title":"Training data-efficient image transformers & distillation through attention","volume-title":"ICML","author":"Touvron"},{"key":"ref4","article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","volume-title":"ICLR","author":"Dosovitskiy"},{"key":"ref5","article-title":"Intriguing properties of vision transformers","author":"Naseer","year":"2021","journal-title":"Neurips"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.4140\/TCP.n.2015.249"},{"key":"ref7","article-title":"Fitnets: Hints for thin deep nets","author":"Romero","year":"2014","journal-title":"arXiv preprint arXiv:1412.6550"},{"key":"ref8","article-title":"Paying more attention to attention: improving the performance of convolutional neural networks via attention transfer","volume-title":"ICLR","author":"Komodakis"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33013779"},{"key":"ref10","article-title":"Transferring inductive biases through knowledge distillation","author":"Abnar","year":"2020","journal-title":"arXiv preprint arXiv:2006.00555"},{"key":"ref11","article-title":"Tinybert: Distilling bert for natural language understanding","author":"Jiao","year":"2019","journal-title":"arXiv preprint arXiv:1909.10351"},{"key":"ref12","article-title":"Distilbert, a distilled version of bert: smaller, faster, cheaper and lighter","author":"Sanh","year":"2019","journal-title":"arXiv preprint arXiv:1910.01108"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-72240-1_21"},{"key":"ref14","article-title":"Learning efficient vision transformers via fine-grained manifold distillation","author":"Hao","year":"2021","journal-title":"Neurips"},{"key":"ref15","article-title":"Transkd: Transformer knowledge distillation for efficient semantic segmentation","author":"Liu","year":"2022","journal-title":"arXiv preprint arXiv:2202.13393"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19803-8_5"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01165"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01420"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00717"},{"key":"ref21","article-title":"Generative pretraining from pixels","volume-title":"ICML","author":"Chen"},{"key":"ref22","article-title":"Zero-shot text-to-image generation","volume-title":"ICML","author":"Ramesh"},{"key":"ref23","article-title":"Understanding the robustness in vision transformers","volume-title":"ICML","author":"Zhou"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19775-8_24"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01173"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.2105.07581"},{"key":"ref27","article-title":"umventing outliers of autoaugment with knowledge distillation","volume-title":"ECCV","author":"Wei"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2021\/362"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01044"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/p19-3007"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00951"}],"event":{"name":"2024 IEEE International Conference on Image Processing (ICIP)","location":"Abu Dhabi, United Arab Emirates","start":{"date-parts":[[2024,10,27]]},"end":{"date-parts":[[2024,10,30]]}},"container-title":["2024 IEEE International Conference on Image Processing (ICIP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10647221\/10647122\/10647295.pdf?arnumber=10647295","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,28]],"date-time":"2024-09-28T05:35:56Z","timestamp":1727501756000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10647295\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,27]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/icip51287.2024.10647295","relation":{},"subject":[],"published":{"date-parts":[[2024,10,27]]}}}