{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,6]],"date-time":"2026-05-06T07:11:40Z","timestamp":1778051500331,"version":"3.51.4"},"reference-count":56,"publisher":"IEEE","license":[{"start":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T00:00:00Z","timestamp":1772755200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T00:00:00Z","timestamp":1772755200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026,3,6]]},"DOI":"10.1109\/wacv61042.2026.00832","type":"proceedings-article","created":{"date-parts":[[2026,5,5]],"date-time":"2026-05-05T19:59:32Z","timestamp":1778011172000},"page":"8628-8638","source":"Crossref","is-referenced-by-count":0,"title":["MedROV: Towards Real-Time Open-Vocabulary Detection Across Diverse Medical Imaging Modalities"],"prefix":"10.1109","author":[{"given":"Tooba Tehreem","family":"Sheikh","sequence":"first","affiliation":[{"name":"Mohamed Bin Zayed University of Artificial Intelligence (MBZUAI)"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jean","family":"Lahoud","sequence":"additional","affiliation":[{"name":"Mohamed Bin Zayed University of Artificial Intelligence (MBZUAI)"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Rao Muhammad","family":"Anwer","sequence":"additional","affiliation":[{"name":"Mohamed Bin Zayed University of Artificial Intelligence (MBZUAI)"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fahad Shahbaz","family":"Khan","sequence":"additional","affiliation":[{"name":"Mohamed Bin Zayed University of Artificial Intelligence (MBZUAI)"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Salman","family":"Khan","sequence":"additional","affiliation":[{"name":"Mohamed Bin Zayed University of Artificial Intelligence (MBZUAI)"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hisham","family":"Cholakkal","sequence":"additional","affiliation":[{"name":"Mohamed Bin Zayed University of Artificial Intelligence (MBZUAI)"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Bccd: Blood cell count and detection","year":"2018"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.dib.2019.104863"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-022-30695-9"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/isbi60581.2025.10980679"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/j.compmedimag.2015.02.007"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TMI.2018.2837502"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2022.102680"},{"key":"ref8","article-title":"Multi-centre multi-vendor & multi-disease cardiac image segmentation challenge (m&ms)","author":"Campello","year":"2020","journal-title":"Medical Image Computing and Computer Assisted Intervention"},{"key":"ref9","article-title":"Meditron-70b: Scaling medical pretraining for large language models","author":"Chen","year":"2023"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01599"},{"key":"ref11","article-title":"Skin lesion analysis toward melanoma detection 2018: A challenge hosted by the international skin imaging collaboration (isic)","author":"Codella","year":"2019"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2022.102485"},{"key":"ref13","article-title":"Totalsegmentator mri: Sequence-independent segmentation of 59 anatomical structures in mr images","author":"D\u2019Antonoli","year":"2024"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2022.102628"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2019.101563"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1016\/j.dib.2023.109662"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/3730436.3730506"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.3978\/j.issn.2223-4292.2014.11.20"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.52202\/068431-2661"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72111-3_4"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.7303\/SYN3193805"},{"key":"ref23","first-page":"1","article-title":"Cell segmentation in multi-modality high-resolution microscopy images with cellpose","volume-title":"NeurIPS","author":"Lee","year":"2023"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01069"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72970-6_3"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA55743.2025.11128145"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1002\/ima.23130"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1002\/mp.14676"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3100536"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2022.102616"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-024-44824-z"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1201\/b19107-17"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20080-9_42"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/tmi.2018.2865709"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1038\/s41597-024-02984-z"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1016\/j.radonc.2024.110410"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3083187.3083212"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2019.101561"},{"key":"ref39","article-title":"Abdomenatlas-8k: Annotating 8,000 ct volumes for multi-organ segmentation in three weeks","volume":"36","author":"Qu","year":"2024","journal-title":"NeurIPS"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.91"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2577031"},{"key":"ref42","article-title":"Dino-x: A unified vision model for open-world object detection and understanding","author":"Ren","year":"2024"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1038\/s41591-024-03423-7"},{"issue":"1","key":"ref44","first-page":"1004","article-title":"A comprehensive retinal image dataset for the assessment of glaucoma from the optic nerve head analysis","volume":"2","author":"Sivaswamy","year":"2015","journal-title":"JSM Biomedical Imaging Data Papers"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.02003"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.369"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1148\/ryai.230024.podcast"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-45673-2_15"},{"issue":"2","key":"ref49","article-title":"Cross-scale attention and multi-layer feature fusion yolov8 for skin disease target detection in medical images","volume":"4","author":"Xu","year":"2025","journal-title":"Journal of Computer Technology and Software"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02586"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20077-9_7"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1056\/aioa2400640"},{"key":"ref53","article-title":"Biomed-parse: a biomedical foundation model for image parsing of everything everywhere all at once","author":"Zhao","year":"2024"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01605"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20077-9_21"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2869576"}],"event":{"name":"2026 IEEE\/CVF Winter Conference on Applications of Computer Vision (WACV)","location":"Tucson, AZ, USA","start":{"date-parts":[[2026,3,6]]},"end":{"date-parts":[[2026,3,10]]}},"container-title":["2026 IEEE\/CVF Winter Conference on Applications of Computer Vision (WACV)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11491838\/11491925\/11492750.pdf?arnumber=11492750","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,6]],"date-time":"2026-05-06T06:14:14Z","timestamp":1778048054000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11492750\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,3,6]]},"references-count":56,"URL":"https:\/\/doi.org\/10.1109\/wacv61042.2026.00832","relation":{},"subject":[],"published":{"date-parts":[[2026,3,6]]}}}