{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,21]],"date-time":"2025-11-21T05:51:28Z","timestamp":1763704288409,"version":"3.45.0"},"reference-count":48,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,26]],"date-time":"2025-10-26T00:00:00Z","timestamp":1761436800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,26]],"date-time":"2025-10-26T00:00:00Z","timestamp":1761436800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,26]]},"DOI":"10.1109\/iccad66269.2025.11240696","type":"proceedings-article","created":{"date-parts":[[2025,11,20]],"date-time":"2025-11-20T18:39:34Z","timestamp":1763663974000},"page":"1-9","source":"Crossref","is-referenced-by-count":0,"title":["Opto-ViT: Architecting a Near-Sensor Region of Interest-Aware Vision Transformer Accelerator with Silicon Photonics"],"prefix":"10.1109","author":[{"given":"Mehrdad","family":"Morsali","sequence":"first","affiliation":[{"name":"New Jersey Institute of Technology,USA"}]},{"given":"Chengwei","family":"Zhou","sequence":"additional","affiliation":[{"name":"Case Western Reserve University,USA"}]},{"given":"Deniz","family":"Najafi","sequence":"additional","affiliation":[{"name":"New Jersey Institute of Technology,USA"}]},{"given":"Sreetama","family":"Sarkar","sequence":"additional","affiliation":[{"name":"University of Southern California,USA"}]},{"given":"Pietro","family":"Mercati","sequence":"additional","affiliation":[{"name":"Intel Corporation,USA"}]},{"given":"Navid","family":"Khoshavi","sequence":"additional","affiliation":[{"name":"AMD,USA"}]},{"given":"Peter","family":"Beerel","sequence":"additional","affiliation":[{"name":"University of Southern California,USA"}]},{"given":"Mahdi","family":"Nikdast","sequence":"additional","affiliation":[{"name":"Colorado State University,USA"}]},{"given":"Gourav","family":"Datta","sequence":"additional","affiliation":[{"name":"Case Western Reserve University,USA"}]},{"given":"Shaahin","family":"Angizi","sequence":"additional","affiliation":[{"name":"New Jersey Institute of Technology,USA"}]}],"member":"263","reference":[{"article-title":"A 100,000 fps vision sensor with embedded 535gops\/w 256\u00d7256 simd processor array","volume-title":"Symposium on VLSI","author":"Carey","key":"ref1"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/jssc.2020.3034192"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC.2017.7870271"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/tcsii.2020.3015902"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/tcsi.2021.3090668"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/JETCAS.2023.3242167"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TETC.2023.3292251"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1038\/s41598-022-17934-1"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/vlsi-soc54400.2022.9939582"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1117\/12.342849"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2022.3179370"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10094902"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00951"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ISCAS46773.2023.10181988"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3400302.3415640"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3583781.3590259"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/JSSC.2015.2420678"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/IEDM19573.2019.8993452"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3476988"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/DAC18074.2021.9586161"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2020.2968184"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.23919\/DATE58400.2024.10546822"},{"article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","volume-title":"International Conference on Learning Representations","author":"Dosovitskiy","key":"ref24"},{"article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","year":"2019","author":"Devlin","key":"ref25"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.23919\/DATE.2019.8715195"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.23919\/date48585.2020.9116494"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3287624.3287720"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/3649329.3656261"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1002\/lpor.201100017"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/AICAS59952.2024.10595882"},{"volume-title":"Ncsu eda freepdk45","year":"2011","key":"ref32"},{"year":"2014","key":"ref33","article-title":"Synopsys design compiler, product version 14.9.2014"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/MDAT.2014.2336211"},{"article-title":"Energy-efficient & real-time computer vision with intelligent skipping via reconfigurable CMOS image sensors","year":"2024","author":"Kaiser","key":"ref35"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00286"},{"article-title":"Estimating or propagating gradients through stochastic neurons for conditional computation","year":"2013","author":"Bengio","key":"ref37"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.3389\/fnins.2022.815258"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01565"},{"article-title":"Imagenet-21k pretraining for the masses","year":"2021","author":"Ridnik","key":"ref40"},{"article-title":"Learning multiple layers of features from tiny images","year":"2009","author":"Krizhevsky","key":"ref41"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20077-9_17"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1145\/3526241.3530364"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2024.3443692"}],"event":{"name":"2025 IEEE\/ACM International Conference On Computer Aided Design (ICCAD)","start":{"date-parts":[[2025,10,26]]},"location":"Munich, Germany","end":{"date-parts":[[2025,10,30]]}},"container-title":["2025 IEEE\/ACM International Conference On Computer Aided Design (ICCAD)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11240608\/11240621\/11240696.pdf?arnumber=11240696","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,21]],"date-time":"2025-11-21T05:43:03Z","timestamp":1763703783000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11240696\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,26]]},"references-count":48,"URL":"https:\/\/doi.org\/10.1109\/iccad66269.2025.11240696","relation":{},"subject":[],"published":{"date-parts":[[2025,10,26]]}}}