{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T05:05:18Z","timestamp":1750309518945,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":31,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,10,25]],"date-time":"2024-10-25T00:00:00Z","timestamp":1729814400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,10,25]]},"DOI":"10.1145\/3704323.3705010","type":"proceedings-article","created":{"date-parts":[[2025,1,7]],"date-time":"2025-01-07T08:25:22Z","timestamp":1736238322000},"page":"74-80","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Monocular Depth Estimation Using Differential Scale Features and Log-Remapping Depth Guidance"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0009-5992-640X","authenticated-orcid":false,"given":"Xiaoxia","family":"Ou","sequence":"first","affiliation":[{"name":"Control science and engineering, South China University of Technology, Guangzhou, Guangdong, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2263-6953","authenticated-orcid":false,"given":"Yuxiang","family":"Wu","sequence":"additional","affiliation":[{"name":"Control science and engineering, South China University of Technology, Guangzhou, Guangdong, China"}]}],"member":"320","published-online":{"date-parts":[[2025,1,7]]},"reference":[{"key":"e_1_3_3_1_2_2","unstructured":"Ashutosh Agarwal and Chetan Arora. 2022. Attention Attention Everywhere: Monocular Depth Prediction with Skip Attention. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2210.09071 (2022)."},{"key":"e_1_3_3_1_3_2","first-page":"6799","volume-title":"Proceedings of the IEEE conference on computer vision and pattern recognition","author":"Alp\u00a0Guler Riza","year":"2017","unstructured":"Riza Alp\u00a0Guler, George Trigeorgis, Epameinondas Antonakos, Patrick Snape, Stefanos Zafeiriou, and Iasonas Kokkinos. 2017. Densereg: Fully convolutional dense shape regression in-the-wild. In Proceedings of the IEEE conference on computer vision and pattern recognition. 6799\u20136808."},{"key":"e_1_3_3_1_4_2","first-page":"4009","volume-title":"Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition","author":"Bhat Shariq\u00a0Farooq","year":"2021","unstructured":"Shariq\u00a0Farooq Bhat, Ibraheem Alhashim, and Peter Wonka. 2021. Adabins: Depth estimation using adaptive bins. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition. 4009\u20134018."},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"crossref","unstructured":"Yuanzhouhan Cao Zifeng Wu and Chunhua Shen. 2017. Estimating depth from monocular images as classification using deep fully convolutional residual networks. IEEE Transactions on Circuits and Systems for Video Technology 28 11 (2017) 3174\u20133182.","DOI":"10.1109\/TCSVT.2017.2740321"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"crossref","unstructured":"Liang-Chieh Chen George Papandreou Iasonas Kokkinos Kevin Murphy and Alan\u00a0L Yuille. 2017. Deeplab: Semantic image segmentation with deep convolutional nets atrous convolution and fully connected crfs. IEEE transactions on pattern analysis and machine intelligence 40 4 (2017) 834\u2013848.","DOI":"10.1109\/TPAMI.2017.2699184"},{"key":"e_1_3_3_1_7_2","unstructured":"David Eigen Christian Puhrsch and Rob Fergus. 2014. Depth map prediction from a single image using a multi-scale deep network. Advances in neural information processing systems 27 (2014)."},{"key":"e_1_3_3_1_8_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00214"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"publisher","DOI":"10.5555\/2354409.2354978"},{"key":"e_1_3_3_1_10_2","unstructured":"Andrew\u00a0G Howard Menglong Zhu Bo Chen Dmitry Kalenichenko Weijun Wang Tobias Weyand Marco Andreetto and Hartwig Adam. 2017. Mobilenets: Efficient convolutional neural networks for mobile vision applications. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1704.04861 (2017)."},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00745"},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"},{"key":"e_1_3_3_1_13_2","unstructured":"Diederik\u00a0P Kingma and Jimmy Ba. 2014. Adam: A method for stochastic optimization. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1412.6980 (2014)."},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2016.32"},{"key":"e_1_3_3_1_15_2","unstructured":"Jin\u00a0Han Lee Myung-Kyu Han Dong\u00a0Wook Ko and Il\u00a0Hong Suh. 2019. From big to small: Multi-scale local planar guidance for monocular depth estimation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1907.10326 (2019)."},{"key":"e_1_3_3_1_16_2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i3.16282"},{"key":"e_1_3_3_1_17_2","first-page":"1119","volume-title":"Proceedings of the IEEE conference on computer vision and pattern recognition","author":"Li Bo","year":"2015","unstructured":"Bo Li, Chunhua Shen, Yuchao Dai, Anton Van Den\u00a0Hengel, and Mingyi He. 2015. Depth and surface normal estimation from monocular images using regression on deep features and hierarchical crfs. In Proceedings of the IEEE conference on computer vision and pattern recognition. 1119\u20131127."},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.365"},{"key":"e_1_3_3_1_19_2","doi-asserted-by":"crossref","unstructured":"Zhenyu Li Zehui Chen Xianming Liu and Junjun Jiang. 2023. DepthFormer: Exploiting Long-range Correlation and Local Information for Accurate Monocular Depth Estimation. Machine Intelligence Research 20 6 (2023) 837\u2013854.","DOI":"10.1007\/s11633-023-1458-0"},{"key":"e_1_3_3_1_20_2","unstructured":"Zhenyu Li Xuyang Wang Xianming Liu and Junjun Jiang. 2022. BinsFormer: Revisiting Adaptive Bins for Monocular Depth Estimation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2204.00987 (2022)."},{"key":"e_1_3_3_1_21_2","unstructured":"Ce Liu Suryansh Kumar Shuhang Gu Radu Timofte and Luc\u00a0Van Gool. 2023. VA-DepthNet: A Variational Approach to Single Image Depth Prediction. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2302.06556 (2023)."},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"crossref","unstructured":"Fayao Liu Chunhua Shen Guosheng Lin and Ian Reid. 2015. Learning depth from single monocular images using deep convolutional neural fields. IEEE transactions on pattern analysis and machine intelligence 38 10 (2015) 2024\u20132039.","DOI":"10.1109\/TPAMI.2015.2505283"},{"key":"e_1_3_3_1_23_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"e_1_3_3_1_24_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01261"},{"key":"e_1_3_3_1_25_2","unstructured":"Adam Paszke Sam Gross Francisco Massa Adam Lerer James Bradbury Gregory Chanan Trevor Killeen Zeming Lin Natalia Gimelshein Luca Antiga et\u00a0al. 2019. Pytorch: An imperative style high-performance deep learning library. Advances in neural information processing systems 32 (2019)."},{"key":"e_1_3_3_1_26_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01196"},{"key":"e_1_3_3_1_27_2","doi-asserted-by":"crossref","unstructured":"Shuwei Shao Ran Li Zhongcai Pei Zhong Liu Weihai Chen Wentao Zhu Xingming Wu and Baochang Zhang. 2022. Towards comprehensive monocular depth estimation: Multiple heads are better than one. IEEE Transactions on Multimedia (2022).","DOI":"10.1109\/TMM.2022.3224810"},{"key":"e_1_3_3_1_28_2","doi-asserted-by":"crossref","unstructured":"Shuwei Shao Zhongcai Pei Xingming Wu Zhong Liu Weihai Chen and Zhengguo Li. 2023. IEBins: Iterative Elastic Bins for Monocular Depth Estimation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2309.14137 (2023).","DOI":"10.1007\/s11263-024-02293-3"},{"key":"e_1_3_3_1_29_2","doi-asserted-by":"crossref","unstructured":"Minsoo Song Seokjae Lim and Wonjun Kim. 2021. Monocular depth estimation using laplacian pyramid-based depth residuals. IEEE transactions on circuits and systems for video technology 31 11 (2021) 4381\u20134393.","DOI":"10.1109\/TCSVT.2021.3049869"},{"key":"e_1_3_3_1_30_2","doi-asserted-by":"crossref","unstructured":"Xianfa Xu Zhe Chen and Fuliang Yin. 2021. Monocular depth estimation with multi-scale feature fusion. IEEE Signal Processing Letters 28 (2021) 678\u2013682.","DOI":"10.1109\/LSP.2021.3067498"},{"key":"e_1_3_3_1_31_2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01596"},{"key":"e_1_3_3_1_32_2","doi-asserted-by":"crossref","unstructured":"Weihao Yuan Xiaodong Gu Zuozhuo Dai Siyu Zhu and Ping Tan. 2022. NeW CRFs: Neural Window Fully-connected CRFs for Monocular Depth Estimation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2203.01502 (2022).","DOI":"10.1109\/CVPR52688.2022.00389"}],"event":{"name":"ICCPR 2024: 2024 13th International Conference on Computing and Pattern Recognition","acronym":"ICCPR 2024","location":"Tianjin China"},"container-title":["Proceedings of the 2024 13th International Conference on Computing and Pattern Recognition"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3704323.3705010","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3704323.3705010","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:18:05Z","timestamp":1750295885000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3704323.3705010"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,25]]},"references-count":31,"alternative-id":["10.1145\/3704323.3705010","10.1145\/3704323"],"URL":"https:\/\/doi.org\/10.1145\/3704323.3705010","relation":{},"subject":[],"published":{"date-parts":[[2024,10,25]]},"assertion":[{"value":"2025-01-07","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}