{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,21]],"date-time":"2026-05-21T10:40:00Z","timestamp":1779360000385,"version":"3.51.4"},"reference-count":84,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,5,29]],"date-time":"2023-05-29T00:00:00Z","timestamp":1685318400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,5,29]],"date-time":"2023-05-29T00:00:00Z","timestamp":1685318400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,5,29]]},"DOI":"10.1109\/icra48891.2023.10161471","type":"proceedings-article","created":{"date-parts":[[2023,7,4]],"date-time":"2023-07-04T17:20:56Z","timestamp":1688491256000},"page":"3116-3123","source":"Crossref","is-referenced-by-count":46,"title":["UDepth: Fast Monocular Depth Estimation for Visually-guided Underwater Robots"],"prefix":"10.1109","author":[{"given":"Boxiao","family":"Yu","sequence":"first","affiliation":[{"name":"University of Florida,Robot Perception and Intelligence (RoboPI) laboratory,Electrical and Computer Engineering (ECE) department,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jiayi","family":"Wu","sequence":"additional","affiliation":[{"name":"University of Florida,Robot Perception and Intelligence (RoboPI) laboratory,Electrical and Computer Engineering (ECE) department,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Md Jahidul","family":"Islam","sequence":"additional","affiliation":[{"name":"University of Florida,Robot Perception and Intelligence (RoboPI) laboratory,Electrical and Computer Engineering (ECE) department,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1177\/0278364913507325"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00043"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2012.6385685"},{"key":"ref56","first-page":"817","article-title":"Deep virtual stereo odometry: Leveraging deep depth prediction for monocular direct sparse odometry","author":"yang","year":"2018","journal-title":"Proceedings of the European Conference on Computer Vision (ECCV)"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1364\/OE.23.033911"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00024"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/s10514-021-09985-6"},{"key":"ref58","doi-asserted-by":"crossref","first-page":"1606","DOI":"10.1109\/TIP.2019.2944343","article-title":"Unsupervised monocular depth estimation from light field image","volume":"29","author":"zhou","year":"2019","journal-title":"IEEE Transactions on Image Processing"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00256"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2018.00045"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TMECH.2019.2929652"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2021.3120670"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2017.2690455"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1016\/j.image.2019.07.007"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/OCEANSKOBE.2018.8559463"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.3390\/s151229864"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1049\/iet-ipr.2019.1533"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2015.7351749"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00225"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.700"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00069"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2017.2740321"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/TETCI.2022.3209306"},{"key":"ref47","first-page":"785","article-title":"Multi-loss rebalancing algorithm for monoc-ular depth estimation","author":"lee","year":"2020","journal-title":"European Conference on Computer Vision"},{"key":"ref42","article-title":"Attention is All You Need","volume":"30","author":"vaswani","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.304"},{"key":"ref44","article-title":"The berhu penalty and the grouped effect","author":"zwald","year":"2012","journal-title":"ArXiv Preprint"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01196"},{"key":"ref49","first-page":"740","article-title":"Unsupervised cnn for single view depth estimation: Geometry to the rescue","author":"garg","year":"2016","journal-title":"European Conference on Computer Vision"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/JSTARS.2021.3100395"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00703"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.23919\/OCEANS.2013.6741175"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1002\/rob.21771"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/IROS45743.2020.9340919"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/IROS40897.2019.8967703"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9197558"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00403"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2012.213"},{"key":"ref40","article-title":"Depth map prediction from a single image using a multi-scale deep network","volume":"27","author":"eigen","year":"2014","journal-title":"Advances in neural information processing systems"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2019.2955241"},{"key":"ref83","doi-asserted-by":"crossref","DOI":"10.15607\/RSS.2022.XVIII.048","article-title":"SVAM: Saliency-guided Visual Attention Modeling by Autonomous Underwater Robots","author":"islam","year":"2022","journal-title":"Robotics Science and Systems (RSS)"},{"key":"ref80","article-title":"Decoupled weight decay regularization","author":"loshchilov","year":"2017","journal-title":"ArXiv Preprint"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00214"},{"key":"ref79","article-title":"Pytorch: An imperative style, high-performance deep learning library","volume":"32","author":"paszke","year":"2019","journal-title":"Advances in neural information processing systems"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/s11431-020-1582-8"},{"key":"ref78","article-title":"An image is worth 16&#x00D7;16 words: Transformers for image recognition at scale","author":"dosovitskiy","year":"2020","journal-title":"ArXiv Preprint"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00399"},{"key":"ref36","article-title":"Towards robust monocular depth estimation: Mixing datasets for zero-shot cross-dataset transfer","author":"ranftl","year":"2020","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00178"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2016.32"},{"key":"ref30","author":"hong","year":"2022","journal-title":"USOD10K A New Benchmark Dataset for Underwater Salient Object Detection"},{"key":"ref74","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2014","journal-title":"ArXiv Preprint"},{"key":"ref33","first-page":"270","article-title":"Unsupervised monocu-lar depth estimation with left-right consistency","author":"godard","year":"2017","journal-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00393"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2020.2974710"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2016.7477644"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.365"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00042"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2017.2759252"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1016\/j.jvcir.2014.11.006"},{"key":"ref73","first-page":"234","article-title":"U-Net: Convolutional Networks for Biomedical Image Segmentation","author":"ronneberger","year":"2015","journal-title":"International Conference on Medical image computing and computer-assisted inter-vention"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8794272"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.3389\/fmars.2021.690962"},{"key":"ref68","first-page":"2341","article-title":"Single Image Haze Removal using Dark Channel Prior","volume":"33","author":"he","year":"2010","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2019.2958950"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/ICInfA.2013.6720385"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1155\/2021\/6644986"},{"key":"ref25","doi-asserted-by":"crossref","first-page":"3268","DOI":"10.3390\/s21093268","article-title":"Unpaired underwater image synthesis with a disentangled representation for underwater depth map prediction","volume":"21","author":"zhao","year":"2021","journal-title":"SENSORS"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/MCG.2016.26"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/JOE.2018.2865045"},{"key":"ref64","article-title":"A large rgb-d dataset for semi-supervised monocular depth estimation","author":"cho","year":"2019","journal-title":"ArXiv Preprint"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA46639.2022.9811802"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TIM.2021.3120130"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/OCEANSE.2017.8084665"},{"key":"ref21","first-page":"678","article-title":"A rapid scene depth estimation model based on underwater light attenuation prior for underwater image restoration","author":"song","year":"2018","journal-title":"Pacific Rim Conference on Multimedia"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/MCG.2016.26"},{"key":"ref28","first-page":"4009","article-title":"Adabins: Depth estimation using adaptive bins","author":"bhat","year":"2021","journal-title":"Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2019.8804200"},{"key":"ref29","article-title":"High quality monocular depth estimation via transfer learning","author":"alhashim","year":"2018","journal-title":"ArXiv Preprint"},{"key":"ref60","first-page":"484","article-title":"Learning monocular depth by distilling cross-domain stereo networks","author":"guo","year":"2018","journal-title":"Proceedings of the European Conference on Computer Vision (ECCV)"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/ROBIO49542.2019.8961504"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.238"}],"event":{"name":"2023 IEEE International Conference on Robotics and Automation (ICRA)","location":"London, United Kingdom","start":{"date-parts":[[2023,5,29]]},"end":{"date-parts":[[2023,6,2]]}},"container-title":["2023 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10160211\/10160212\/10161471.pdf?arnumber=10161471","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,24]],"date-time":"2023-07-24T17:32:28Z","timestamp":1690219948000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10161471\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,5,29]]},"references-count":84,"URL":"https:\/\/doi.org\/10.1109\/icra48891.2023.10161471","relation":{},"subject":[],"published":{"date-parts":[[2023,5,29]]}}}