{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,2]],"date-time":"2025-11-02T19:23:20Z","timestamp":1762111400051,"version":"build-2065373602"},"publisher-location":"Cham","reference-count":57,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031734106"},{"type":"electronic","value":"9783031734113"}],"license":[{"start":{"date-parts":[[2024,11,23]],"date-time":"2024-11-23T00:00:00Z","timestamp":1732320000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,23]],"date-time":"2024-11-23T00:00:00Z","timestamp":1732320000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-73411-3_11","type":"book-chapter","created":{"date-parts":[[2024,11,22]],"date-time":"2024-11-22T20:08:09Z","timestamp":1732306089000},"page":"183-200","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Surface-Centric Modeling for\u00a0High-Fidelity Generalizable Neural Surface Reconstruction"],"prefix":"10.1007","author":[{"given":"Rui","family":"Peng","sequence":"first","affiliation":[]},{"given":"Shihe","family":"Shen","sequence":"additional","affiliation":[]},{"given":"Kaiqiang","family":"Xiong","sequence":"additional","affiliation":[]},{"given":"Huachen","family":"Gao","sequence":"additional","affiliation":[]},{"given":"Jianbo","family":"Jiao","sequence":"additional","affiliation":[]},{"given":"Xiaodong","family":"Gu","sequence":"additional","affiliation":[]},{"given":"Ronggang","family":"Wang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,23]]},"reference":[{"key":"11_CR1","doi-asserted-by":"crossref","unstructured":"Aan\u00e6s, H., Jensen, R.R., Vogiatzis, G., Tola, E., Dahl, A.B.: Large-scale data for multiple-view stereopsis. IJCV 120, 153\u2013168 (2016)","DOI":"10.1007\/s11263-016-0902-9"},{"key":"11_CR2","doi-asserted-by":"crossref","unstructured":"Barron, J.T., Mildenhall, B., Tancik, M., Hedman, P., Martin-Brualla, R., Srinivasan, P.P.: Mip-nerf: a multiscale representation for anti-aliasing neural radiance fields. In: ICCV, pp. 5855\u20135864 (2021)","DOI":"10.1109\/ICCV48922.2021.00580"},{"key":"11_CR3","doi-asserted-by":"crossref","unstructured":"Campbell, N.D., Vogiatzis, G., Hern\u00e1ndez, C., Cipolla, R.: Using multiple hypotheses to improve depth-maps for multi-view stereo. In: ECCV, pp. 766\u2013779 (2008)","DOI":"10.1007\/978-3-540-88682-2_58"},{"key":"11_CR4","doi-asserted-by":"crossref","unstructured":"Chang, D., et al.: Rc-mvsnet: unsupervised multi-view stereo with neural rendering. In: ECCV (2022)","DOI":"10.1007\/978-3-031-19821-2_38"},{"key":"11_CR5","doi-asserted-by":"crossref","unstructured":"Chen, A., et al.: Mvsnerf: fast generalizable radiance field reconstruction from multi-view stereo. In: ICCV, pp. 14124\u201314133 (2021)","DOI":"10.1109\/ICCV48922.2021.01386"},{"key":"11_CR6","unstructured":"Chen, H., Li, C., Lee, G.H.: Neusg: Neural implicit surface reconstruction with 3d gaussian splatting guidance. arXiv preprint arXiv:2312.00846 (2023)"},{"issue":"8","key":"11_CR7","doi-asserted-by":"publisher","first-page":"1362","DOI":"10.1109\/TPAMI.2009.161","volume":"32","author":"Y Furukawa","year":"2009","unstructured":"Furukawa, Y., Ponce, J.: Accurate, dense, and robust multiview stereopsis. IEEE TPAMI 32(8), 1362\u20131376 (2009)","journal-title":"IEEE TPAMI"},{"key":"11_CR8","doi-asserted-by":"crossref","unstructured":"Galliani, S., Lasinger, K., Schindler, K.: Massively parallel multiview stereopsis by surface normal diffusion. In: ICCV, pp. 873\u2013881 (2015)","DOI":"10.1109\/ICCV.2015.106"},{"key":"11_CR9","doi-asserted-by":"crossref","unstructured":"Godard, C., Mac\u00a0Aodha, O., Firman, M., Brostow, G.J.: Digging into self-supervised monocular depth estimation. In: ICCV, pp. 3828\u20133838 (2019)","DOI":"10.1109\/ICCV.2019.00393"},{"key":"11_CR10","unstructured":"Gropp, A., Yariv, L., Haim, N., Atzmon, M., Lipman, Y.: Implicit geometric regularization for learning shapes. In: MLSys, pp. 3569\u20133579 (2020)"},{"key":"11_CR11","doi-asserted-by":"crossref","unstructured":"Gu, X., Fan, Z., Zhu, S., Dai, Z., Tan, F., Tan, P.: Cascade cost volume for high-resolution multi-view stereo and stereo matching. In: CVPR, pp. 2495\u20132504 (2020)","DOI":"10.1109\/CVPR42600.2020.00257"},{"key":"11_CR12","doi-asserted-by":"crossref","unstructured":"Gu\u00e9don, A., Lepetit, V.: Sugar: saurface-aligned gaussian splatting for efficient 3D mesh reconstruction and high-quality mesh rendering. In: CVPR (2024)","DOI":"10.1109\/CVPR52733.2024.00512"},{"key":"11_CR13","unstructured":"Hong, Y., et al.: Lrm: large reconstruction model for single image to 3d. In: ICLR (2024)"},{"key":"11_CR14","doi-asserted-by":"crossref","unstructured":"Johari, M.M., Lepoittevin, Y., Fleuret, F.: Geonerf: generalizing nerf with geometry priors. In: CVPR, pp. 18365\u201318375 (2022)","DOI":"10.1109\/CVPR52688.2022.01782"},{"key":"11_CR15","doi-asserted-by":"crossref","unstructured":"Kazhdan, M., Hoppe, H.: Screened poisson surface reconstruction. ACM ToG 32(3), 1\u201313 (2013)","DOI":"10.1145\/2487228.2487237"},{"key":"11_CR16","doi-asserted-by":"crossref","unstructured":"Kerbl, B., Kopanas, G., Leimk\u00fchler, T., Drettakis, G.: 3d gaussian splatting for real-time radiance field rendering. ACM TOG 42(4) (2023)","DOI":"10.1145\/3592433"},{"key":"11_CR17","unstructured":"Kingma, D.P., Ba, J.: Adam: A method for stochastic optimization. In: ICLR (2014)"},{"issue":"4","key":"11_CR18","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3072959.3073599","volume":"36","author":"A Knapitsch","year":"2017","unstructured":"Knapitsch, A., Park, J., Zhou, Q.Y., Koltun, V.: Tanks and temples: benchmarking large-scale scene reconstruction. ACM Trans. Graph. (ToG) 36(4), 1\u201313 (2017)","journal-title":"ACM Trans. Graph. (ToG)"},{"key":"11_CR19","doi-asserted-by":"publisher","first-page":"199","DOI":"10.1023\/A:1008191222954","volume":"38","author":"KN Kutulakos","year":"2000","unstructured":"Kutulakos, K.N., Seitz, S.M.: A theory of shape by space carving. IJCV 38, 199\u2013218 (2000)","journal-title":"IJCV"},{"issue":"3","key":"11_CR20","doi-asserted-by":"publisher","first-page":"418","DOI":"10.1109\/TPAMI.2005.44","volume":"27","author":"M Lhuillier","year":"2005","unstructured":"Lhuillier, M., Quan, L.: A quasi-dense approach to surface reconstruction from uncalibrated images. IEEE TPAMI 27(3), 418\u2013433 (2005)","journal-title":"IEEE TPAMI"},{"key":"11_CR21","unstructured":"Li, J., et al.: Instant3d: Fast text-to-3d with sparse-view generation and large reconstruction model. In: ICLR (2024)"},{"key":"11_CR22","unstructured":"Liang, Y., He, H., Chen, Y.c.: Rethinking rendering in generalizable neural surface reconstruction: a learning-based solution. In: NeurIPS (2023)"},{"key":"11_CR23","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., Belongie, S.: Feature pyramid networks for object detection. In: CVPR, pp. 2117\u20132125 (2017)","DOI":"10.1109\/CVPR.2017.106"},{"key":"11_CR24","doi-asserted-by":"crossref","unstructured":"Long, X., Lin, C., Wang, P., Komura, T., Wang, W.: Sparseneus: fast generalizable neural surface reconstruction from sparse views. In: ECCV, pp. 210\u2013227 (2022)","DOI":"10.1007\/978-3-031-19824-3_13"},{"key":"11_CR25","doi-asserted-by":"crossref","unstructured":"Lorensen, W.E., Cline, H.E.: Marching cubes: a high resolution 3d surface construction algorithm. In: ACM siggraph computer graphics (1987)","DOI":"10.1145\/37401.37422"},{"key":"11_CR26","doi-asserted-by":"crossref","unstructured":"Mescheder, L., Oechsle, M., Niemeyer, M., Nowozin, S., Geiger, A.: Occupancy networks: learning 3D reconstruction in function space. In: CVPR, pp. 4460\u20134470 (2019)","DOI":"10.1109\/CVPR.2019.00459"},{"key":"11_CR27","doi-asserted-by":"crossref","unstructured":"Mildenhall, B., Srinivasan, P.P., Tancik, M., Barron, J.T., Ramamoorthi, R., Ng, R.: Nerf: representing scenes as neural radiance fields for view synthesis. In: ECCV (2020)","DOI":"10.1007\/978-3-030-58452-8_24"},{"key":"11_CR28","doi-asserted-by":"crossref","unstructured":"M\u00fcller, T., Evans, A., Schied, C., Keller, A.: Instant neural graphics primitives with a multiresolution hash encoding. In: SIGGRAPH (2022)","DOI":"10.1145\/3528223.3530127"},{"key":"11_CR29","doi-asserted-by":"crossref","unstructured":"Niemeyer, M., Mescheder, L., Oechsle, M., Geiger, A.: Differentiable volumetric rendering: learning implicit 3d representations without 3D supervision. In: CVPR, pp. 3504\u20133515 (2020)","DOI":"10.1109\/CVPR42600.2020.00356"},{"issue":"6","key":"11_CR30","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2508363.2508374","volume":"32","author":"M Nie\u00dfner","year":"2013","unstructured":"Nie\u00dfner, M., Zollh\u00f6fer, M., Izadi, S., Stamminger, M.: Real-time 3d reconstruction at scale using voxel hashing. ACM ToG 32(6), 1\u201311 (2013)","journal-title":"ACM ToG"},{"key":"11_CR31","doi-asserted-by":"crossref","unstructured":"Oechsle, M., Mescheder, L., Niemeyer, M., Strauss, T., Geiger, A.: Texture fields: Learning texture representations in function space. In: ICCV, pp. 4531\u20134540 (2019)","DOI":"10.1109\/ICCV.2019.00463"},{"key":"11_CR32","doi-asserted-by":"crossref","unstructured":"Oechsle, M., Peng, S., Geiger, A.: Unisurf: Unifying neural implicit surfaces and radiance fields for multi-view reconstruction. In: ICCV, pp. 5589\u20135599 (2021)","DOI":"10.1109\/ICCV48922.2021.00554"},{"key":"11_CR33","doi-asserted-by":"crossref","unstructured":"Park, J.J., Florence, P., Straub, J., Newcombe, R., Lovegrove, S.: Deepsdf: learning continuous signed distance functions for shape representation. In: CVPR, pp. 165\u2013174 (2019)","DOI":"10.1109\/CVPR.2019.00025"},{"key":"11_CR34","unstructured":"Peng, R., Gu, X., Tang, L., Shen, S., Yu, F., Wang, R.: Gens: Generalizable neural surface reconstruction from multi-view images. In: NeurIPS (2023)"},{"key":"11_CR35","doi-asserted-by":"crossref","unstructured":"Peng, R., Wang, R., Lai, Y., Tang, L., Cai, Y.: Excavating the potential capacity of self-supervised monocular depth estimation. In: ICCV, pp. 15560\u201315569 (2021)","DOI":"10.1109\/ICCV48922.2021.01527"},{"key":"11_CR36","doi-asserted-by":"crossref","unstructured":"Peng, R., Wang, R., Wang, Z., Lai, Y., Wang, R.: Rethinking depth estimation for multi-view stereo: a unified representation. In: CVPR, pp. 8645\u20138654 (2022)","DOI":"10.1109\/CVPR52688.2022.00845"},{"key":"11_CR37","doi-asserted-by":"crossref","unstructured":"Ren, Y., Zhang, T., Pollefeys, M., S\u00fcsstrunk, S., Wang, F.: Volrecon: volume rendering of signed ray distance functions for generalizable multi-view reconstruction. In: CVPR, pp. 16685\u201316695 (2023)","DOI":"10.1109\/CVPR52729.2023.01601"},{"key":"11_CR38","doi-asserted-by":"crossref","unstructured":"Schonberger, J.L., Frahm, J.M.: Structure-from-motion revisited. In: CVPR, pp. 4104\u20134113 (2016)","DOI":"10.1109\/CVPR.2016.445"},{"key":"11_CR39","doi-asserted-by":"crossref","unstructured":"Sch\u00f6nberger, J.L., Zheng, E., Frahm, J.M., Pollefeys, M.: Pixelwise view selection for unstructured multi-view stereo. In: ECCV, pp. 501\u2013518 (2016)","DOI":"10.1007\/978-3-319-46487-9_31"},{"key":"11_CR40","doi-asserted-by":"crossref","unstructured":"Schops, T., et al.: A multi-view stereo benchmark with high-resolution images and multi-camera videos. In: CVPR, pp. 3260\u20133269 (2017)","DOI":"10.1109\/CVPR.2017.272"},{"key":"11_CR41","doi-asserted-by":"publisher","first-page":"151","DOI":"10.1023\/A:1008176507526","volume":"35","author":"SM Seitz","year":"1999","unstructured":"Seitz, S.M., Dyer, C.R.: Photorealistic scene reconstruction by voxel coloring. IJCV 35, 151\u2013173 (1999)","journal-title":"IJCV"},{"key":"11_CR42","unstructured":"Wang, P., Liu, L., Liu, Y., Theobalt, C., Komura, T., Wang, W.: Neus: learning neural implicit surfaces by volume rendering for multi-view reconstruction. In: NeurIPS (2021)"},{"key":"11_CR43","doi-asserted-by":"crossref","unstructured":"Wang, Q., et al.: Ibrnet: Learning multi-view image-based rendering. In: CVPR, pp. 4690\u20134699 (2021)","DOI":"10.1109\/CVPR46437.2021.00466"},{"key":"11_CR44","doi-asserted-by":"crossref","unstructured":"Wang, Y., Han, Q., Habermann, M., Daniilidis, K., Theobalt, C., Liu, L.: Neus2: fast learning of neural implicit surfaces for multi-view reconstruction. In: ICCV, pp. 3295\u20133306 (2023)","DOI":"10.1109\/ICCV51070.2023.00305"},{"key":"11_CR45","unstructured":"Wang, Y., Skorokhodov, I., Wonka, P.: Hf-neus: improved surface reconstruction using high-frequency details. In: NeurIPS (2022)"},{"issue":"4","key":"11_CR46","first-page":"600","volume":"13","author":"Z Wang","year":"2004","unstructured":"Wang, Z., Bovik, A.C., Sheikh, H.R., Simoncelli, E.P.: Image quality assessment: from error visibility to structural similarity. IEEE TIP 13(4), 600\u2013612 (2004)","journal-title":"IEEE TIP"},{"key":"11_CR47","unstructured":"Wu, T., et al.: Voxurf: voxel-based efficient and accurate neural surface reconstruction. In: ICLR (2022)"},{"key":"11_CR48","doi-asserted-by":"crossref","unstructured":"Xu, L., et al.: C2f2neus: cascade cost frustum fusion for high fidelity and generalizable neural surface reconstruction. In: ICCV (2023)","DOI":"10.1109\/ICCV51070.2023.01677"},{"key":"11_CR49","doi-asserted-by":"crossref","unstructured":"Yao, Y., Luo, Z., Li, S., Fang, T., Quan, L.: Mvsnet: depth inference for unstructured multi-view stereo. In: ECCV, pp. 767\u2013783 (2018)","DOI":"10.1007\/978-3-030-01237-3_47"},{"key":"11_CR50","doi-asserted-by":"crossref","unstructured":"Yao, Y., et al.: Blendedmvs: a large-scale dataset for generalized multi-view stereo networks. In: CVPR, pp. 1790\u20131799 (2020)","DOI":"10.1109\/CVPR42600.2020.00186"},{"key":"11_CR51","first-page":"4805","volume":"34","author":"L Yariv","year":"2021","unstructured":"Yariv, L., Gu, J., Kasten, Y., Lipman, Y.: Volume rendering of neural implicit surfaces. NeurIPS 34, 4805\u20134815 (2021)","journal-title":"NeurIPS"},{"key":"11_CR52","first-page":"2492","volume":"33","author":"L Yariv","year":"2020","unstructured":"Yariv, L., et al.: Multiview neural surface reconstruction by disentangling geometry and appearance. NeurIPS 33, 2492\u20132502 (2020)","journal-title":"NeurIPS"},{"key":"11_CR53","doi-asserted-by":"crossref","unstructured":"Yu, A., Ye, V., Tancik, M., Kanazawa, A.: pixelnerf: neural radiance fields from one or few images. In: CVPR, pp. 4578\u20134587 (2021)","DOI":"10.1109\/CVPR46437.2021.00455"},{"key":"11_CR54","unstructured":"Yu, Z., Peng, S., Niemeyer, M., Sattler, T., Geiger, A.: Monosdf: exploring monocular geometric cues for neural implicit surface reconstruction. In: NeurIPS (2022)"},{"key":"11_CR55","unstructured":"Zhang, J., et al.: Critical regularizations for neural surface reconstruction in the wild. In: CVPR, pp. 6270\u20136279 (2022)"},{"key":"11_CR56","doi-asserted-by":"crossref","unstructured":"Zhang, J., Yao, Y., Quan, L.: Learning signed distance field for multi-view surface reconstruction. In: ICCV, pp. 6525\u20136534 (2021)","DOI":"10.1109\/ICCV48922.2021.00646"},{"issue":"6","key":"11_CR57","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3478513.3480500","volume":"40","author":"X Zhang","year":"2021","unstructured":"Zhang, X., Srinivasan, P.P., Deng, B., Debevec, P., Freeman, W.T., Barron, J.T.: Nerfactor: neural factorization of shape and reflectance under an unknown illumination. ACM ToG 40(6), 1\u201318 (2021)","journal-title":"ACM ToG"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-73411-3_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,22]],"date-time":"2024-11-22T21:25:05Z","timestamp":1732310705000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-73411-3_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,23]]},"ISBN":["9783031734106","9783031734113"],"references-count":57,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-73411-3_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024,11,23]]},"assertion":[{"value":"23 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}