{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,25]],"date-time":"2026-05-25T20:07:25Z","timestamp":1779739645013,"version":"3.53.1"},"reference-count":67,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"funder":[{"name":"Horizon Europe High Performance, Safe, Secure, Open-Source Leveraged RISC-V Domain-Specific Ecosystems Project","award":["101112274"],"award-info":[{"award-number":["101112274"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2026]]},"DOI":"10.1109\/access.2026.3694334","type":"journal-article","created":{"date-parts":[[2026,5,18]],"date-time":"2026-05-18T19:47:23Z","timestamp":1779133643000},"page":"75865-75880","source":"Crossref","is-referenced-by-count":0,"title":["MR2-ByteTrack: CNN and Transformer-Based Video Object Detection for AI-Augmented Embedded Vision Sensor Nodes"],"prefix":"10.1109","volume":"14","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-1277-8584","authenticated-orcid":false,"given":"Luca","family":"Bompani","sequence":"first","affiliation":[{"name":"1Department of Electrical, Electronic, and Information Engineering &#x201C;Guglielmo Marconi&#x201D; (DEI), University of Bologna, Bologna, Italy"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7458-4019","authenticated-orcid":false,"given":"Manuele","family":"Rusci","sequence":"additional","affiliation":[{"name":"2Department of Electrical Engineering (ESAT), KU Leuven, Leuven, Belgium"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8068-3806","authenticated-orcid":false,"given":"Luca","family":"Benini","sequence":"additional","affiliation":[{"name":"1Department of Electrical, Electronic, and Information Engineering &#x201C;Guglielmo Marconi&#x201D; (DEI), University of Bologna, Bologna, Italy"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4487-0836","authenticated-orcid":false,"given":"Daniele","family":"Palossi","sequence":"additional","affiliation":[{"name":"3Integrated Systems Laboratory (IIS), ETH Z&#x00FC;rich, Zurich, Switzerland"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7924-933X","authenticated-orcid":false,"given":"Francesco","family":"Conti","sequence":"additional","affiliation":[{"name":"1Department of Electrical, Electronic, and Information Engineering &#x201C;Guglielmo Marconi&#x201D; (DEI), University of Bologna, Bologna, Italy"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/JSEN.2021.3055618"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-022-10141-4"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2017.2778504"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/JSEN.2021.3139988"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/JSEN.2023.3240092"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICMCSI61536.2024.00080"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.23919\/DATE56975.2023.10137154"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i11.21588"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/JSSC.2021.3114881"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ISCAS51556.2021.9401730"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW63382.2024.00223"},{"key":"ref12","article-title":"An image is worth 16\u00d716 words: Transformers for image recognition at scale","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Dosovitskiy"},{"issue":"1","key":"ref13","doi-asserted-by":"crossref","first-page":"32","DOI":"10.3390\/technologies13010032","article-title":"Vision transformers for image classification: A comparative survey","volume":"13","author":"Wang","year":"2025","journal-title":"Technologies"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/s10462-023-10595-0"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01587"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref17","volume-title":"Nanodet-Plus Superfast and High Accuracy Lightweight Anchor-Free Object Detection Model","year":"2021"},{"key":"ref18","article-title":"YOLOx: Exceeding YOLO series in 2021","author":"Ge","year":"2021","journal-title":"arXiv:2107.08430"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICUS55513.2022.9986841"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.52"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00931"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01035"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3223955"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i2.25320"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.5220\/0007260000002108"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ISCC53001.2021.9631435"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00640"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00511"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2024.3350380"},{"key":"ref30","article-title":"Looking fast and slow: Memory-guided mobile video object detection","author":"Liu","year":"2019","journal-title":"arXiv:1903.10172"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/JSEN.2024.3425904"},{"key":"ref32","article-title":"Seq-NMS for video object detection","author":"Han","year":"2016","journal-title":"arXiv:1602.08465"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2016.2577031"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"ref36","article-title":"What is YOLOv8: An in-depth exploration of the internal features of the next-generation object detector","author":"Yaseen","year":"2024"},{"key":"ref37","first-page":"107984","article-title":"YOLOv10: Real-time end-to-end object detection","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Chen"},{"key":"ref38","article-title":"YOLOv11: An overview of the key architectural enhancements","author":"Khanam","year":"2024","journal-title":"arXiv:2410.17725"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"ref40","article-title":"MobileViT: Light-weight, general-purpose, and mobile-friendly vision transformer","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Mehta"},{"key":"ref41","article-title":"MobileViTv3: Mobile-friendly vision transformer with simple and effective fusion of local, global and input features","author":"Wadekar","year":"2022","journal-title":"arXiv:2209.15159"},{"key":"ref42","article-title":"Separable self-attention for mobile vision transformers","author":"Mehta","year":"2022","journal-title":"arXiv:2206.02680"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.510"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1016\/j.isprsjprs.2021.04.004"},{"key":"ref45","article-title":"Integrated object detection and tracking with tracklet-conditioned detection","author":"Zhang","year":"2018","journal-title":"arXiv:1811.11167"},{"key":"ref46","article-title":"Deformable DETR: Deformable transformers for end-to-end object detection","author":"Zhu","year":"2020","journal-title":"arXiv:2010.04159"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2016.7533003"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20047-2_1"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.23919\/DATE58400.2024.10546577"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2024.3404878"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-91989-3_17"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN60899.2024.10651090"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1145\/3744339"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/COINS51742.2021.9524173"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/TC.2024.3500360"},{"issue":"1","key":"ref56","doi-asserted-by":"crossref","first-page":"8","DOI":"10.3390\/jlpea15010008","article-title":"Optimizing BFloat16 deployment of tiny transformers on ultra-low power extreme edge SoCs","volume":"15","author":"Dequino","year":"2025","journal-title":"J. Low Power Electron. Appl."},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/LCOMM.2023.3303091"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2858826"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA55743.2025.11128029"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/TAFE.2024.3451888"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1145\/3719210"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2004.10934"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3119563"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00900"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2020.102907"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"}],"container-title":["IEEE Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/6287639\/11323511\/11522964.pdf?arnumber=11522964","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,25]],"date-time":"2026-05-25T19:55:36Z","timestamp":1779738936000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11522964\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"references-count":67,"URL":"https:\/\/doi.org\/10.1109\/access.2026.3694334","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]}}}