{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,30]],"date-time":"2024-10-30T00:10:24Z","timestamp":1730247024753,"version":"3.28.0"},"reference-count":37,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,10,27]],"date-time":"2024-10-27T00:00:00Z","timestamp":1729987200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,10,27]],"date-time":"2024-10-27T00:00:00Z","timestamp":1729987200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,10,27]]},"DOI":"10.1109\/icip51287.2024.10647455","type":"proceedings-article","created":{"date-parts":[[2024,9,27]],"date-time":"2024-09-27T18:34:45Z","timestamp":1727462085000},"page":"2142-2148","source":"Crossref","is-referenced-by-count":0,"title":["Efficient Visual Question Answering on Embedded Devices: Cross-Modality Attention With Evolutionary Quantization"],"prefix":"10.1109","author":[{"given":"Aakansha","family":"Mishra","sequence":"first","affiliation":[{"name":"Samsung Research Institute,Bangalore"}]},{"given":"Aditya","family":"Agarwala","sequence":"additional","affiliation":[{"name":"Samsung Research Institute,Bangalore"}]},{"given":"Utsav","family":"Tiwari","sequence":"additional","affiliation":[{"name":"Samsung Research Institute,Bangalore"}]},{"given":"Vikram N","family":"Rajendiran","sequence":"additional","affiliation":[{"name":"Samsung Research Institute,Bangalore"}]},{"given":"Srinivas S","family":"Miriyala","sequence":"additional","affiliation":[{"name":"Samsung Research Institute,Bangalore"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.3390\/bioengineering10030380"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01008"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.4018\/JOEUC.347914"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.279"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46478-7_28"},{"key":"ref6","article-title":"Show, ask, attend, and answer: A strong baseline for visual question answering","author":"Kazemi","year":"2017","journal-title":"arXiv preprint arXiv:1704.03162"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00636"},{"key":"ref8","article-title":"Learning to count objects in natural images for visual question answering","author":"Zhang","year":"2018","journal-title":"arXiv preprint arXiv:1802.05766"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1514"},{"key":"ref10","article-title":"Attention is all you need","author":"Vaswani","year":"2017","journal-title":"Advances in neural information processing systems, 30"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01046"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.627"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-emnlp.489"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2023.3347291"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.499"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.10"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58577-8_7"},{"key":"ref18","article-title":"Blip-2: Bootstrapping language-image pre-training with frozen image encoders and large language models","author":"Li","year":"2023","journal-title":"arXiv preprint arXiv:2301.12597"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01438"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICSCDS56580.2023.10104870"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i9.26255"},{"key":"ref22","article-title":"LXMERT Model Compression for Visual Question Answering","author":"Hashemi","year":"2023","journal-title":"arXiv preprint arXiv:2310.15325"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3534619"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i10.21316"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2023.3254205"},{"key":"ref26","first-page":"8470","article-title":"POP-VQAPrivacy Preserving, On-Device, Personalized Visual Question Answering","volume-title":"Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision","author":"Sahu"},{"key":"ref27","article-title":"A white paper on neural network quantization","author":"Nagel","year":"2021","journal-title":"arXiv preprint arXiv:2106.08295"},{"key":"ref28","article-title":"Faster r-cnn: Towards real-time object detection with region proposal networks","volume":"28","author":"Ren","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1162"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-30504-7_8"},{"journal-title":"onnxruntime.ai","key":"ref31","article-title":"ONNX Runtime Home"},{"volume-title":"Snapdragon Neural Processing Engine SDK","key":"ref32"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.670"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00680"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/iccv.2019.00592"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TAI.2022.3160418"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109848"}],"event":{"name":"2024 IEEE International Conference on Image Processing (ICIP)","start":{"date-parts":[[2024,10,27]]},"location":"Abu Dhabi, United Arab Emirates","end":{"date-parts":[[2024,10,30]]}},"container-title":["2024 IEEE International Conference on Image Processing (ICIP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10647221\/10647122\/10647455.pdf?arnumber=10647455","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,28]],"date-time":"2024-09-28T05:36:28Z","timestamp":1727501788000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10647455\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,27]]},"references-count":37,"URL":"https:\/\/doi.org\/10.1109\/icip51287.2024.10647455","relation":{},"subject":[],"published":{"date-parts":[[2024,10,27]]}}}