{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,6]],"date-time":"2026-04-06T21:09:08Z","timestamp":1775509748499,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":47,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,10,28]],"date-time":"2024-10-28T00:00:00Z","timestamp":1730073600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,10,28]]},"DOI":"10.1145\/3664647.3681372","type":"proceedings-article","created":{"date-parts":[[2024,10,26]],"date-time":"2024-10-26T06:59:49Z","timestamp":1729925989000},"page":"4197-4206","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["Eglcr: Edge Structure Guidance and Scale Adaptive Attention for Iterative Stereo Matching"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-0582-2976","authenticated-orcid":false,"given":"Zhien","family":"Dai","sequence":"first","affiliation":[{"name":"School of Automation, Central South University, Changsha, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4132-4987","authenticated-orcid":false,"given":"Zhaohui","family":"Tang","sequence":"additional","affiliation":[{"name":"School of Automation, Central South University, Changsha, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6894-0926","authenticated-orcid":false,"given":"Hu","family":"Zhang","sequence":"additional","affiliation":[{"name":"College of Computer Science and Engineering, Changsha University &amp; School of Mathematics and Statistics, Central South University, Changsha, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6182-3818","authenticated-orcid":false,"given":"Can","family":"Tian","sequence":"additional","affiliation":[{"name":"School of Computer Science and Cyber Engineering, Guangzhou University, Guangzhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-8334-3550","authenticated-orcid":false,"given":"Mingjun","family":"Pan","sequence":"additional","affiliation":[{"name":"School of Electronic and Computer Engineering, Peking University, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2060-6574","authenticated-orcid":false,"given":"Yongfang","family":"Xie","sequence":"additional","affiliation":[{"name":"School of Automation, Central South University, Changsha, China"}]}],"member":"320","published-online":{"date-parts":[[2024,10,28]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00567"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01653"},{"key":"e_1_3_2_1_3_1","first-page":"22158","article-title":"Hierarchical neural architecture search for deep stereo matching","volume":"33","author":"Cheng Xuelian","year":"2020","unstructured":"Xuelian Cheng, Yiran Zhong, Mehrtash Harandi, Yuchao Dai, Xiaojun Chang, Hongdong Li, Tom Drummond, and Zongyuan Ge. 2020. Hierarchical neural architecture search for deep stereo matching. Advances in Neural Information Processing Systems 33 (2020), 22158--22169.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2019.00010"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"crossref","unstructured":"Yang et al. 2022. Edge supervision and multi-scale cost volume for stereo matching. Image and Vision Computing (2022).","DOI":"10.1016\/j.imavis.2021.104336"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00339"},{"key":"e_1_3_2_1_8_1","volume-title":"Proceedings, Part VII 13","author":"Gupta Saurabh","year":"2014","unstructured":"Saurabh Gupta, Ross Girshick, Pablo Arbel\u00e1ez, and Jitendra Malik. 2014. Learning rich features from RGB-D images for object detection and segmentation. In Computer Vision--ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6--12, 2014, Proceedings, Part VII 13. Springer, 345--360."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2005.56"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP42928.2021.9506469"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.17"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2013.6631104"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2006.1033"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2001.937668"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01578"},{"key":"e_1_3_2_1_16_1","volume-title":"Stereo matching using multi-level cost","author":"Liang Zhengfa","year":"2019","unstructured":"Zhengfa Liang, Yulan Guo, Yiliu Feng, Wei Chen, Linbo Qiao, Li Zhou, Jianfeng Zhang, and Hengzhu Liu. 2019. Stereo matching using multi-level cost volume and multi-scale feature constancy. IEEE transactions on pattern analysis and machine intelligence 43, 1 (2019), 300--315."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/3DV53792.2021.00032"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i2.20056"},{"key":"e_1_3_2_1_19_1","volume-title":"Decoupled weight decay regularization. arXiv preprint arXiv:1711.05101","author":"Loshchilov Ilya","year":"2017","unstructured":"Ilya Loshchilov and Frank Hutter. 2017. Decoupled weight decay regularization. arXiv preprint arXiv:1711.05101 (2017)."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2023.3260901"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.438"},{"key":"e_1_3_2_1_22_1","volume-title":"Joint 3d estimation of vehicles and scene flow. ISPRS annals of the photogrammetry, remote sensing and spatial information sciences 2","author":"Menze Moritz","year":"2015","unstructured":"Moritz Menze, Christian Heipke, and Andreas Geiger. 2015. Joint 3d estimation of vehicles and scene flow. ISPRS annals of the photogrammetry, remote sensing and spatial information sciences 2 (2015), 427."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-11752-2_3"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.272"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01369"},{"key":"e_1_3_2_1_27_1","volume-title":"PCW-Net: Pyramid Combination and Warping Cost","author":"Shen Zhelun","year":"2022","unstructured":"Zhelun Shen, Yuchao Dai, Xibin Song, Zhibo Rao, Dingfu Zhou, and Liangjun Zhang. 2022. PCW-Net: Pyramid Combination and Warping Cost Volume for Stereo Matching. In European Conference on Computer Vision(ECCV)."},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01019"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-019-01287-w"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01413"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00841"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"crossref","unstructured":"Philippe Weinzaepfel Thomas Lucas Vincent Leroy Yohann Cabon Vaibhav Arora Romain Br\u00e9gier Gabriela Csurka Leonid Antsfeld Boris Chidlovskii and J\u00e9r\u00f4me Revaud. 2023. CroCo v2: Improved Cross-view Completion Pre-training for Stereo Matching and Optical Flow. In ICCV.","DOI":"10.1109\/ICCV51070.2023.01647"},{"key":"e_1_3_2_1_33_1","volume-title":"Proceedings of the IEEE\/CVF international conference on computer vision. 7484--7493","author":"Zhang Xiaoping","year":"2019","unstructured":"ZhenyaoWu, XinyiWu, Xiaoping Zhang, SongWang, and Lili Ju. 2019. Semantic stereo matching with pyramid cost volumes. In Proceedings of the IEEE\/CVF international conference on computer vision. 7484--7493."},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01231"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01264"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02099"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00203"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2023.3298645"},{"key":"e_1_3_2_1_39_1","volume-title":"Proceedings of the AAAI Conference on Artificial Intelligence","volume":"35","author":"Xu Hongbin","year":"2021","unstructured":"Hongbin Xu, Zhipeng Zhou, Yu Qiao, Wenxiong Kang, and Qiuxia Wu. 2021. Self-supervised multi-view stereo via effective co-segmentation and dataaugmentation. In Proceedings of the AAAI Conference on Artificial Intelligence, Vol. 35. 3030--3038."},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00566"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00744"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00603"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00027"},{"key":"e_1_3_2_1_44_1","volume-title":"Domain-invariant Stereo Matching Networks. In Europe Conference on Computer Vision (ECCV).","author":"Zhang Feihu","year":"2020","unstructured":"Feihu Zhang, Xiaojuan Qi, Ruigang Yang, Victor Prisacariu, Benjamin Wah, and Philip Torr. 2020. Domain-invariant Stereo Matching Networks. In Europe Conference on Computer Vision (ECCV)."},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2009.2020478"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00134"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00872"}],"event":{"name":"MM '24: The 32nd ACM International Conference on Multimedia","location":"Melbourne VIC Australia","acronym":"MM '24","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 32nd ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3664647.3681372","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3664647.3681372","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:17:44Z","timestamp":1750295864000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3664647.3681372"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,28]]},"references-count":47,"alternative-id":["10.1145\/3664647.3681372","10.1145\/3664647"],"URL":"https:\/\/doi.org\/10.1145\/3664647.3681372","relation":{},"subject":[],"published":{"date-parts":[[2024,10,28]]},"assertion":[{"value":"2024-10-28","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}