{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,24]],"date-time":"2026-02-24T17:23:06Z","timestamp":1771953786219,"version":"3.50.1"},"reference-count":51,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,6]]},"DOI":"10.1109\/cvpr.2018.00040","type":"proceedings-article","created":{"date-parts":[[2018,12,18]],"date-time":"2018-12-18T01:49:37Z","timestamp":1545097777000},"page":"311-320","source":"Crossref","is-referenced-by-count":172,"title":["Monocular Relative Depth Perception with Web Stereo Data Supervision"],"prefix":"10.1109","author":[{"given":"Ke","family":"Xian","sequence":"first","affiliation":[]},{"given":"Chunhua","family":"Shen","sequence":"additional","affiliation":[]},{"given":"Zhiguo","family":"Cao","sequence":"additional","affiliation":[]},{"given":"Hao","family":"Lu","sequence":"additional","affiliation":[]},{"given":"Yang","family":"Xiao","sequence":"additional","affiliation":[]},{"given":"Ruibo","family":"Li","sequence":"additional","affiliation":[]},{"given":"Zhenbo","family":"Luo","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","first-page":"1","article-title":"Quasi-euclidean uncalibrated epipolar rectification","author":"fusiello","year":"2008","journal-title":"Proc IEEE Int Conf Patt Recogn"},{"key":"ref38","article-title":"Stereo matching by training a convolutional neural network to compare image patches","volume":"17","author":"zbontar","year":"2016","journal-title":"J Mach Learn Res"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.52"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.595"},{"key":"ref31","article-title":"Unsuper-vised learning of depth and ego-motion from video","author":"zhou","year":"2017","journal-title":"Proc IEEE Conf Comp Vis Patt Recogn"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.699"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2007.1166"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.638"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.173"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1145\/1273496.1273513"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2016.69"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.304"},{"key":"ref29","article-title":"Unsupervised cnn for single view depth estimation: Geometry to the rescue","author":"garg","year":"2016","journal-title":"In Proc European Conf Comp Vis"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2016.32"},{"key":"ref1","article-title":"Depth map prediction from a single image using a multi-scale deep network","author":"eigen","year":"2014","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref20","article-title":"Estimating depth from monocular images as classification using deep fully convolutional residual networks","author":"cao","year":"2017","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"ref22","article-title":"Depth and surface normal estimation from monocular images using regression on deep features and hierarchical crfs","author":"li","year":"2015","journal-title":"Proc IEEE Conf Comp Vis Patt Recogn"},{"key":"ref21","article-title":"Unified depth prediction and intrinsic image decomposition from a single image via joint convolutional neural fields","author":"kim","year":"2016","journal-title":"In Proc European Conf Comp Vis"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298897"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.25"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298635"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.19"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1145\/2733373.2807412"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126343"},{"key":"ref10","article-title":"Indoor segmentation and support inference from rgbd images","author":"silberman","year":"2012","journal-title":"Proc Eur Conf Comp Vis"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2008.132"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.549"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2010.5539823"},{"key":"ref13","article-title":"Learning depth from single monocular images","author":"saxena","year":"2005","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2015.2495261"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.401"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2013.2270375"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.97"},{"key":"ref18","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2505283"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.594"},{"key":"ref6","article-title":"Single-image depth perception in the wild","author":"chen","year":"2016","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref5","article-title":"Depth from a single image by harmonizing overcomplete local network predictions","author":"chakrabarti","year":"2016","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref8","article-title":"Break ames room illusion: Depth from general single images","author":"shi","year":"2015","journal-title":"Ann ACM SIGIR Asia Con!"},{"key":"ref7","doi-asserted-by":"crossref","DOI":"10.1109\/TPAMI.2014.2316835","article-title":"Depthtransfer: Depth extraction from video using non-parametric sampling","author":"karsch","year":"2014","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.179"},{"key":"ref46","author":"chen","year":"2016","journal-title":"Deeplab Semantic image segmentation with deep convolutional nets atrous convolution and fully connected crfs"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.660"},{"key":"ref48","author":"wang","year":"2017","journal-title":"Understanding convolution for semantic segmentation"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.106"},{"key":"ref42","first-page":"513","article-title":"Parameter learning and convergent inference for dense random fields","author":"kr\u00e4henb\u00fchl","year":"2013","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.544"},{"key":"ref44","author":"uhrig","year":"0","journal-title":"Sparsity invariant CNNs"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.458"}],"event":{"name":"2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","location":"Salt Lake City, UT","start":{"date-parts":[[2018,6,18]]},"end":{"date-parts":[[2018,6,23]]}},"container-title":["2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8576498\/8578098\/08578138.pdf?arnumber=8578138","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,26]],"date-time":"2022-01-26T23:37:07Z","timestamp":1643240227000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8578138\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,6]]},"references-count":51,"URL":"https:\/\/doi.org\/10.1109\/cvpr.2018.00040","relation":{},"subject":[],"published":{"date-parts":[[2018,6]]}}}