{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T15:47:06Z","timestamp":1774021626151,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":49,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,8,10]]},"DOI":"10.1145\/3721238.3730659","type":"proceedings-article","created":{"date-parts":[[2025,7,23]],"date-time":"2025-07-23T08:40:47Z","timestamp":1753260047000},"page":"1-11","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Monocular Online Reconstruction with Enhanced Detail Preservation"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0009-9581-2506","authenticated-orcid":false,"given":"Songyin","family":"Wu","sequence":"first","affiliation":[{"name":"Meta Reality Labs Research, Seattle, USA and University of California Santa Barbara, Santa Barbara, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7788-9982","authenticated-orcid":false,"given":"Zhaoyang","family":"Lv","sequence":"additional","affiliation":[{"name":"Meta Reality Labs Research, San Francisco, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-8716-201X","authenticated-orcid":false,"given":"Yufeng","family":"Zhu","sequence":"additional","affiliation":[{"name":"Meta Reality Labs Research, Seattle, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5948-3452","authenticated-orcid":false,"given":"Duncan","family":"Frost","sequence":"additional","affiliation":[{"name":"Meta Reality Labs Research, London, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0868-2141","authenticated-orcid":false,"given":"Zhengqin","family":"Li","sequence":"additional","affiliation":[{"name":"Meta Reality Labs Research, Seattle, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9379-094X","authenticated-orcid":false,"given":"Ling-Qi","family":"Yan","sequence":"additional","affiliation":[{"name":"University of California Santa Barbara, Santa Barbara, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-0942-2929","authenticated-orcid":false,"given":"Carl","family":"Ren","sequence":"additional","affiliation":[{"name":"Meta Reality Labs Research, Seattle, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-9091-8989","authenticated-orcid":false,"given":"Richard","family":"Newcombe","sequence":"additional","affiliation":[{"name":"Meta Reality Labs Research, Seattle, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9026-6886","authenticated-orcid":false,"given":"Zhao","family":"Dong","sequence":"additional","affiliation":[{"name":"Meta Reality Labs Research, Seattle, USA"}]}],"member":"320","published-online":{"date-parts":[[2025,7,27]]},"reference":[{"key":"e_1_3_3_2_2_1","unstructured":"Lizhi Bai Chunqi Tian Jun Yang Siyu Zhang Masanori Suganuma and Takayuki Okatani. 2024. RP-SLAM: Real-time Photorealistic SLAM with Efficient 3D Gaussian Splatting. arxiv:https:\/\/arXiv.org\/abs\/2412.09868\u00a0[cs.RO] https:\/\/arxiv.org\/abs\/2412.09868"},{"key":"e_1_3_3_2_3_1","doi-asserted-by":"crossref","unstructured":"Carlos Campos Richard Elvira Juan J\u00a0G\u00f3mez Rodr\u00edguez Jos\u00e9\u00a0MM Montiel and Juan\u00a0D Tard\u00f3s. 2021. Orb-slam3: An accurate open-source library for visual visual\u2013inertial and multimap slam. IEEE Transactions on Robotics 37 6 (2021) 1874\u20131890.","DOI":"10.1109\/TRO.2021.3075644"},{"key":"e_1_3_3_2_4_1","doi-asserted-by":"crossref","unstructured":"Yan-Pei Cao Leif Kobbelt and Shi-Min Hu. 2018. Real-time high-accuracy three-dimensional reconstruction with consumer RGB-D cameras. ACM Transactions on Graphics (TOG) 37 5 (2018) 1\u201316.","DOI":"10.1145\/3182157"},{"key":"e_1_3_3_2_5_1","doi-asserted-by":"crossref","unstructured":"Jiawen Chen Dennis Bautembach and Shahram Izadi. 2013. Scalable real-time volumetric surface reconstruction. ACM Trans. Graph. 32 4 (2013) 113\u20131.","DOI":"10.1145\/2461912.2461940"},{"key":"e_1_3_3_2_6_1","doi-asserted-by":"crossref","unstructured":"Angela Dai Matthias Nie\u00dfner Michael Zollh\u00f6fer Shahram Izadi and Christian Theobalt. 2017. Bundlefusion: Real-time globally consistent 3d reconstruction using on-the-fly surface reintegration. ACM Transactions on Graphics (ToG) 36 4 (2017) 1.","DOI":"10.1145\/3072959.3126814"},{"key":"e_1_3_3_2_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01261"},{"key":"e_1_3_3_2_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/2030112.2030123"},{"key":"e_1_3_3_2_9_1","unstructured":"Jakob Engel Kiran Somasundaram Michael Goesele Albert Sun Alexander Gamino Andrew Turner Arjang Talattof Arnie Yuan Bilal Souti Brighid Meredith et\u00a0al. 2023. Project aria: A new tool for egocentric multi-modal ai research. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2308.13561 (2023)."},{"key":"e_1_3_3_2_10_1","unstructured":"Dapeng Feng Zhiqiang Chen Yizhen Yin Shipeng Zhong Yuhua Qi and Hongbo Chen. 2024. CaRtGS: Computational Alignment for Real-Time Gaussian Splatting SLAM. arxiv:https:\/\/arXiv.org\/abs\/2410.00486\u00a0[cs.CV] https:\/\/arxiv.org\/abs\/2410.00486"},{"key":"e_1_3_3_2_11_1","doi-asserted-by":"crossref","unstructured":"Jorge Fuentes-Pacheco Jos\u00e9 Ruiz-Ascencio and Juan\u00a0Manuel Rend\u00f3n-Mancha. 2015. Visual simultaneous localization and mapping: a survey. Artificial intelligence review 43 (2015) 55\u201381.","DOI":"10.1007\/s10462-012-9365-8"},{"key":"e_1_3_3_2_12_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72764-1_11"},{"key":"e_1_3_3_2_13_1","unstructured":"Yan\u00a0Song Hu Nicolas Abboud Muhammad\u00a0Qasim Ali Adam\u00a0Srebrnjak Yang Imad Elhajj Daniel Asmar Yuhao Chen and John\u00a0S. Zelek. 2024. MGSO: Monocular Real-time Photometric SLAM with Efficient 3D Gaussian Splatting. arxiv:https:\/\/arXiv.org\/abs\/2409.13055\u00a0[cs.RO] https:\/\/arxiv.org\/abs\/2409.13055"},{"key":"e_1_3_3_2_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02039"},{"key":"e_1_3_3_2_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00882"},{"key":"e_1_3_3_2_16_1","doi-asserted-by":"crossref","unstructured":"Shi-Sheng Huang Haoxiang Chen Jiahui Huang Hongbo Fu and Shi-Min Hu. 2021a. Real-time globally consistent 3D reconstruction with semantic priors. IEEE transactions on visualization and computer graphics 29 4 (2021) 1977\u20131991.","DOI":"10.1109\/TVCG.2021.3137912"},{"key":"e_1_3_3_2_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01670"},{"key":"e_1_3_3_2_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.02018"},{"key":"e_1_3_3_2_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2013.9"},{"key":"e_1_3_3_2_20_1","doi-asserted-by":"crossref","unstructured":"Bernhard Kerbl Georgios Kopanas Thomas Leimk\u00fchler and George Drettakis. 2023. 3D Gaussian splatting for real-time radiance field rendering. ACM Trans. Graph. 42 4 (2023) 139\u20131.","DOI":"10.1145\/3592433"},{"key":"e_1_3_3_2_21_1","doi-asserted-by":"crossref","unstructured":"Andr\u00e9a Macario\u00a0Barros Maugan Michel Yoann Moline Gwenol\u00e9 Corre and Fr\u00e9d\u00e9rick Carrel. 2022. A comprehensive survey of visual slam algorithms. Robotics 11 1 (2022) 24.","DOI":"10.3390\/robotics11010024"},{"key":"e_1_3_3_2_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01708"},{"key":"e_1_3_3_2_23_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_24"},{"key":"e_1_3_3_2_24_1","doi-asserted-by":"crossref","unstructured":"Thomas M\u00fcller Alex Evans Christoph Schied and Alexander Keller. 2022. Instant neural graphics primitives with a multiresolution hash encoding. ACM Trans. Graph. Article 102 (2022) 15\u00a0pages.","DOI":"10.1145\/3528223.3530127"},{"key":"e_1_3_3_2_25_1","unstructured":"Richard\u00a0A. Newcombe. 2012. Dense Visual SLAM. Ph.\u00a0D. Dissertation. Imperial College London. https:\/\/rapiderobot.bitbucket.io\/papers\/Newcombe-RA-Thesis-2014-compressed.pdf"},{"key":"e_1_3_3_2_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISMAR.2011.6092378"},{"key":"e_1_3_3_2_27_1","doi-asserted-by":"crossref","unstructured":"Matthias Nie\u00dfner Michael Zollh\u00f6fer Shahram Izadi and Marc Stamminger. 2013. Real-time 3D reconstruction at scale using voxel hashing. ACM Transactions on Graphics (ToG) 32 6 (2013) 1\u201311.","DOI":"10.1145\/2508363.2508374"},{"key":"e_1_3_3_2_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/3641519.3657455"},{"key":"e_1_3_3_2_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01690"},{"key":"e_1_3_3_2_30_1","doi-asserted-by":"crossref","unstructured":"Erik Sandstr\u00f6m Keisuke Tateno Michael Oechsle Michael Niemeyer Luc Van\u00a0Gool Martin\u00a0R Oswald and Federico Tombari. 2024. Splat-SLAM: Globally Optimized RGB-only SLAM with 3D Gaussians. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2405.16544 (2024).","DOI":"10.1109\/CVPRW67362.2025.00156"},{"key":"e_1_3_3_2_31_1","unstructured":"Julian Straub Thomas Whelan Lingni Ma Yufan Chen Erik Wijmans Simon Green Jakob\u00a0J Engel Raul Mur-Artal Carl Ren Shobhit Verma et\u00a0al. 2019. The Replica dataset: A digital replica of indoor spaces. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/1906.05797 (2019)."},{"key":"e_1_3_3_2_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2012.6385773"},{"key":"e_1_3_3_2_33_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00617"},{"key":"e_1_3_3_2_34_1","unstructured":"Wen Tianci Liu Zhiang Lu Biao and Fang Yongchun. 2025. Scaffold-SLAM: Structured 3D Gaussians for Simultaneous Localization and Photorealistic Mapping. arxiv:https:\/\/arXiv.org\/abs\/2501.05242\u00a0[cs.CV] https:\/\/arxiv.org\/abs\/2501.05242"},{"key":"e_1_3_3_2_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01277"},{"key":"e_1_3_3_2_36_1","unstructured":"Meng Wang Junyi Wang Changqun Xia Chen Wang and Yue Qi. 2024. OG-Mapping: Octree-based Structured 3D Gaussians for Online Dense Mapping. arxiv:https:\/\/arXiv.org\/abs\/2408.17223\u00a0[cs.CV] https:\/\/arxiv.org\/abs\/2408.17223"},{"key":"e_1_3_3_2_37_1","doi-asserted-by":"crossref","unstructured":"Zhou Wang Alan\u00a0C Bovik Hamid\u00a0R Sheikh and Eero\u00a0P Simoncelli. 2004. Image quality assessment: from error visibility to structural similarity. IEEE transactions on image processing 13 4 (2004) 600\u2013612.","DOI":"10.1109\/TIP.2003.819861"},{"key":"e_1_3_3_2_38_1","first-page":"3","volume-title":"Robotics: science and systems","author":"Whelan Thomas","year":"2015","unstructured":"Thomas Whelan, Stefan Leutenegger, Renato\u00a0F Salas-Moreno, Ben Glocker, and Andrew\u00a0J Davison. 2015. ElasticFusion: Dense SLAM without a pose graph.. In Robotics: science and systems , Vol.\u00a011. Rome, Italy, 3."},{"key":"e_1_3_3_2_39_1","doi-asserted-by":"crossref","unstructured":"Yabin Xu Liangliang Nan Laishui Zhou Jun Wang and Charlie\u00a0CL Wang. 2022. Hrbf-fusion: Accurate 3d reconstruction from rgb-d data using on-the-fly implicits. ACM Transactions on Graphics (TOG) 41 3 (2022) 1\u201319.","DOI":"10.1145\/3516521"},{"key":"e_1_3_3_2_40_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01853"},{"key":"e_1_3_3_2_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISMAR55827.2022.00066"},{"key":"e_1_3_3_2_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52733.2024.01839"},{"key":"e_1_3_3_2_43_1","unstructured":"Vladimir Yugay Yue Li Theo Gevers and Martin\u00a0R Oswald. 2023. Gaussian-slam: Photo-realistic dense slam with gaussian splatting. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2312.10070 (2023)."},{"key":"e_1_3_3_2_44_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00068"},{"key":"e_1_3_3_2_45_1","doi-asserted-by":"crossref","unstructured":"Wei Zhang Qing Cheng David Skuddis Niclas Zeller Daniel Cremers and Norbert Haala. 2024. HI-SLAM2: Geometry-Aware Gaussian SLAM for Fast Monocular Scene Reconstruction. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2411.17982 (2024).","DOI":"10.1109\/TRO.2025.3626627"},{"key":"e_1_3_3_2_46_1","doi-asserted-by":"crossref","unstructured":"Yizhong Zhang Weiwei Xu Yiying Tong and Kun Zhou. 2015. Online structure analysis for real-time indoor scene reconstruction. ACM Transactions on Graphics (TOG) 34 5 (2015) 1\u201313.","DOI":"10.1145\/2768821"},{"key":"e_1_3_3_2_47_1","unstructured":"Yang Zhou Songyin Wu and Ling-Qi Yan. 2024. Unified Gaussian Primitives for Scene Representation and Rendering. arxiv:https:\/\/arXiv.org\/abs\/2406.09733\u00a0[cs.GR] https:\/\/arxiv.org\/abs\/2406.09733"},{"key":"e_1_3_3_2_48_1","doi-asserted-by":"publisher","DOI":"10.1109\/3DV62453.2024.00096"},{"key":"e_1_3_3_2_49_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01245"},{"key":"e_1_3_3_2_50_1","doi-asserted-by":"publisher","DOI":"10.1111\/cgf.13386"}],"event":{"name":"SIGGRAPH Conference Papers '25: Special Interest Group on Computer Graphics and Interactive Techniques Conference Conference Papers","location":"Vancouver BC Canada","acronym":"SIGGRAPH Conference Papers '25","sponsor":["SIGGRAPH ACM Special Interest Group on Computer Graphics and Interactive Techniques"]},"container-title":["Proceedings of the Special Interest Group on Computer Graphics and Interactive Techniques Conference Conference Papers"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3721238.3730659","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T14:52:17Z","timestamp":1774018337000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3721238.3730659"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,27]]},"references-count":49,"alternative-id":["10.1145\/3721238.3730659","10.1145\/3721238"],"URL":"https:\/\/doi.org\/10.1145\/3721238.3730659","relation":{},"subject":[],"published":{"date-parts":[[2025,7,27]]},"assertion":[{"value":"2025-07-27","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}