{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,1,18]],"date-time":"2025-01-18T05:07:30Z","timestamp":1737176850136,"version":"3.33.0"},"reference-count":57,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,12,15]],"date-time":"2024-12-15T00:00:00Z","timestamp":1734220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,12,15]],"date-time":"2024-12-15T00:00:00Z","timestamp":1734220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,12,15]]},"DOI":"10.1109\/bigdata62323.2024.10826036","type":"proceedings-article","created":{"date-parts":[[2025,1,16]],"date-time":"2025-01-16T18:31:23Z","timestamp":1737052283000},"page":"928-937","source":"Crossref","is-referenced-by-count":0,"title":["OSR-ViT: A Simple and Modular Framework for Open-Set Object Detection and Discovery"],"prefix":"10.1109","author":[{"given":"Matthew","family":"Inkawhich","sequence":"first","affiliation":[{"name":"Duke University,Durham,NC,USA"}]},{"given":"Nathan","family":"Inkawhich","sequence":"additional","affiliation":[{"name":"Air Force Research Laboratory,Rome,NY,USA"}]},{"given":"Hao","family":"Yang","sequence":"additional","affiliation":[{"name":"Johns Hopkins University,Baltimore,MD,USA"}]},{"given":"Jingyang","family":"Zhang","sequence":"additional","affiliation":[{"name":"Duke University,Durham,NC,USA"}]},{"given":"Randolph","family":"Linderman","sequence":"additional","affiliation":[{"name":"Duke University,Durham,NC,USA"}]},{"given":"Yiran","family":"Chen","sequence":"additional","affiliation":[{"name":"Duke University,Durham,NC,USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.169"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2016.2577031"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.91"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"article-title":"Deformable DETR: deformable transformers for end-to-end object detection","volume-title":"International Conference on Learning Representations (ICLR)","author":"Zhu","key":"ref7"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2012.256"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/WACV45572.2020.9093355"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00577"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2018.8460700"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8793821"},{"key":"ref13","article-title":"VOS: learning what you don\u2019t know by virtual outlier synthesis","author":"Du","year":"2022","journal-title":"CoRR"},{"key":"ref14","article-title":"SIREN: shaping representations for detecting out-of-distribution objects","volume-title":"Advances in Neural Information Processing Systems (NeurIPS)","author":"Du","year":"2022"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01331"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2926463"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00252"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19806-9_21"},{"key":"ref19","article-title":"Medical open set recognition via intra-class clustering","volume-title":"Medical Imaging with Deep Learning","author":"Deng","year":"2024"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/WACV57701.2024.00199"},{"key":"ref21","article-title":"Dinov2: Learning robust visual features without supervision","author":"Oquab","year":"2023","journal-title":"CoRR"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-009-0275-4"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.253"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298724"},{"key":"ref25","article-title":"Unsupervised object discovery and segmentation of rgbd-images","author":"Ekekrantz","year":"2017","journal-title":"CoRR"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00966"},{"key":"ref27","article-title":"Object-centric learning with slot attention","author":"Locatello","year":"2020","journal-title":"Advances in Neural Information Processing Systems (NeurIPS)"},{"key":"ref28","article-title":"Extending one-stage detection with open-world proposals","author":"Konan","year":"2022","journal-title":"CoRR"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2022.3146922"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20053-3_16"},{"key":"ref31","article-title":"Cascade RPN: delving into high-quality region proposal network with adaptive convolution","volume-title":"Advances in Neural Information Processing Systems (NeurIPS)","author":"Vu","year":"2019"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00308"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2021.3123374"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00937"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1506.02142"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00902"},{"key":"ref37","article-title":"Revisiting open world object detection","author":"Zhao","year":"2022","journal-title":"CoRR"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20080-9_12"},{"article-title":"Objects in semantic topology","volume-title":"International Conference on Learning Representations (ICLR)","author":"Yang","key":"ref39"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP46576.2022.9897461"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1145\/3552458.3556453"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01101"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01416"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20077-9_7"},{"key":"ref45","article-title":"Bridging the gap between object and image-level representations for open-vocabulary detection","volume-title":"Advances in Neural Information Processing Systems (NeurIPS)","author":"Rasheed","year":"2022"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00679"},{"key":"ref47","article-title":"Scaling open-vocabulary object detection","author":"Minderer","year":"2023","journal-title":"CoRR"},{"key":"ref48","article-title":"Energy-based out-of-distribution detection","volume-title":"Advances in Neural Information Processing Systems (NeurIPS)","author":"Liu","year":"2020"},{"key":"ref49","article-title":"A simple unified framework for detecting out-of-distribution samples and adversarial attacks","volume-title":"Advances in Neural Information Processing Systems (NeurIPS)","author":"Lee","year":"2018"},{"article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","volume-title":"International Conference on Learning Representations (ICLR)","author":"Dosovitskiy","key":"ref50"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"article-title":"Pseudo-label: The simple and efficient semi-supervised learning method for deep neural networks","year":"2013","author":"Lee","key":"ref52"},{"article-title":"Learning transferable visual models from natural language supervision","volume-title":"International Conference on Machine Learning (ICML)","author":"Radford","key":"ref53"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1405.0312"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00852"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/JSTARS.2021.3104230"},{"key":"ref57","article-title":"Visualizing data using t-sne","volume":"9","author":"van der Maaten","year":"2008","journal-title":"Journal of Machine Learning Research"}],"event":{"name":"2024 IEEE International Conference on Big Data (BigData)","start":{"date-parts":[[2024,12,15]]},"location":"Washington, DC, USA","end":{"date-parts":[[2024,12,18]]}},"container-title":["2024 IEEE International Conference on Big Data (BigData)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10824975\/10824942\/10826036.pdf?arnumber=10826036","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,17]],"date-time":"2025-01-17T07:49:03Z","timestamp":1737100143000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10826036\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,15]]},"references-count":57,"URL":"https:\/\/doi.org\/10.1109\/bigdata62323.2024.10826036","relation":{},"subject":[],"published":{"date-parts":[[2024,12,15]]}}}