{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,21]],"date-time":"2026-05-21T17:33:57Z","timestamp":1779384837313,"version":"3.53.1"},"publisher-location":"Cham","reference-count":72,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031734106","type":"print"},{"value":"9783031734113","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,11,23]],"date-time":"2024-11-23T00:00:00Z","timestamp":1732320000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,23]],"date-time":"2024-11-23T00:00:00Z","timestamp":1732320000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-73411-3_27","type":"book-chapter","created":{"date-parts":[[2024,11,22]],"date-time":"2024-11-22T20:06:58Z","timestamp":1732306018000},"page":"473-491","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Leveraging Near-Field Lighting for\u00a0Monocular Depth Estimation from\u00a0Endoscopy Videos"],"prefix":"10.1007","author":[{"given":"Akshay","family":"Paruchuri","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Samuel","family":"Ehrenstein","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Shuxian","family":"Wang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Inbar","family":"Fried","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Stephen M.","family":"Pizer","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Marc","family":"Niethammer","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Roni","family":"Sengupta","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2024,11,23]]},"reference":[{"issue":"11","key":"27_CR1","doi-asserted-by":"publisher","first-page":"3329","DOI":"10.21037\/jtd.2016.11.81","volume":"8","author":"M Andolfi","year":"2016","unstructured":"Andolfi, M., Potenza, R., Capozzi, R., Liparulo, V., Puma, F., Yasufuku, K.: The role of bronchoscopy in the diagnosis of early lung cancer: a review. J. Thorac. Dis. 8(11), 3329 (2016)","journal-title":"J. Thorac. Dis."},{"key":"27_CR2","unstructured":"Anonymous: Structure-preserving image translation for depth estimation in colonoscopy (2024), paper submitted to another conference that releases a portion of the clinical data used in this paper"},{"key":"27_CR3","doi-asserted-by":"publisher","unstructured":"Azagra, P., et al.: Endomapper dataset of complete calibrated endoscopy procedures. Sci. Data 10(1) (2023). https:\/\/doi.org\/10.1038\/s41597-023-02564-7. http:\/\/dx.doi.org\/10.1038\/s41597-023-02564-7","DOI":"10.1038\/s41597-023-02564-7"},{"key":"27_CR4","unstructured":"Bae, G., Budvytis, I., Cipolla, R.: IronDepth: iterative refinement of single-view depth using surface normal and its uncertainty. arXiv preprint arXiv:2210.03676 (2022)"},{"key":"27_CR5","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"774","DOI":"10.1007\/978-3-030-59716-0_74","volume-title":"Medical Image Computing and Computer Assisted Intervention \u2013 MICCAI 2020","author":"G Bae","year":"2020","unstructured":"Bae, G., Budvytis, I., Yeung, C.-K., Cipolla, R.: Deep multi-view stereo for dense 3D reconstruction from monocular endoscopic video. In: Martel, A.L., et al. (eds.) MICCAI 2020. LNCS, vol. 12263, pp. 774\u2013783. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-59716-0_74"},{"key":"27_CR6","doi-asserted-by":"publisher","first-page":"239","DOI":"10.1007\/s11263-006-8815-7","volume":"72","author":"R Basri","year":"2007","unstructured":"Basri, R., Jacobs, D., Kemelmacher, I.: Photometric stereo with general, unknown lighting. Int. J. Comput. Vision 72, 239\u2013257 (2007)","journal-title":"Int. J. Comput. Vision"},{"issue":"1","key":"27_CR7","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1007\/s004649900002","volume":"14","author":"G Berci","year":"2000","unstructured":"Berci, G., Forde, K.A.: History of endoscopy. Surg. Endosc. 14(1), 5\u201315 (2000)","journal-title":"Surg. Endosc."},{"key":"27_CR8","doi-asserted-by":"publisher","unstructured":"Bobrow, T.L., Golhar, M., Vijayan, R., Akshintala, V.S., Garcia, J.R., Durr, N.J.: Colonoscopy 3D video dataset with paired depth from 2D-3D registration. Med. Image Anal. 90, 102956 (2023). https:\/\/doi.org\/10.1016\/j.media.2023.102956. http:\/\/dx.doi.org\/10.1016\/j.media.2023.102956","DOI":"10.1016\/j.media.2023.102956"},{"key":"27_CR9","unstructured":"Chen, W., Fu, Z., Yang, D., Deng, J.: Single-image depth perception in the wild. Adv. Neural Inf. Process. Syst. 29 (2016)"},{"key":"27_CR10","doi-asserted-by":"crossref","unstructured":"Eftekhar, A., Sax, A., Bachmann, R., Malik, J., Zamir, A.: OmniData: a scalable pipeline for making multi-task mid-level vision datasets from 3D scans (2021)","DOI":"10.1109\/ICCV48922.2021.01061"},{"key":"27_CR11","unstructured":"Eigen, D., Puhrsch, C., Fergus, R.: Depth map prediction from a single image using a multi-scale deep network. Adv. Neural Inf. Process. Syst. 27 (2014)"},{"issue":"9","key":"27_CR12","doi-asserted-by":"publisher","first-page":"1066","DOI":"10.1164\/rccm.201503-0474ST","volume":"191","author":"A Faro","year":"2015","unstructured":"Faro, A., et al.: Official American thoracic society technical standards: flexible airway endoscopy in children. Am. J. Respir. Crit. Care Med. 191(9), 1066\u20131080 (2015)","journal-title":"Am. J. Respir. Crit. Care Med."},{"key":"27_CR13","doi-asserted-by":"crossref","unstructured":"Fu, H., Gong, M., Wang, C., Batmanghelich, K., Tao, D.: Deep ordinal regression network for monocular depth estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2002\u20132011 (2018)","DOI":"10.1109\/CVPR.2018.00214"},{"key":"27_CR14","unstructured":"Furlanello, T., Lipton, Z., Tschannen, M., Itti, L., Anandkumar, A.: Born again neural networks. In: International Conference on Machine Learning, pp. 1607\u20131616. PMLR (2018)"},{"key":"27_CR15","doi-asserted-by":"crossref","unstructured":"Godard, C., Aodha, O.M., Firman, M., Brostow, G.: Digging into self-supervised monocular depth estimation (2019)","DOI":"10.1109\/ICCV.2019.00393"},{"key":"27_CR16","doi-asserted-by":"publisher","first-page":"1789","DOI":"10.1007\/s11263-021-01453-z","volume":"129","author":"J Gou","year":"2021","unstructured":"Gou, J., Yu, B., Maybank, S.J., Tao, D.: Knowledge distillation: a survey. Int. J. Comput. Vision 129, 1789\u20131819 (2021)","journal-title":"Int. J. Comput. Vision"},{"key":"27_CR17","unstructured":"Grand View Research: Endoscopy procedures estimates market volume, share & trends analysis report by application (gastroscopy, colonoscopy, laparoscopy), by region (North America, Asia Pacific, Europe), and segment forecasts, 2023 - 2030 (2023). https:\/\/www.grandviewresearch.com\/industry-analysis\/endoscopy-procedures-estimates-market-report"},{"issue":"4","key":"27_CR18","doi-asserted-by":"publisher","first-page":"543","DOI":"10.1016\/j.media.2009.05.004","volume":"13","author":"T Heimann","year":"2009","unstructured":"Heimann, T., Meinzer, H.P.: Statistical shape models for 3d medical image segmentation: a review. Med. Image Anal. 13(4), 543\u2013563 (2009)","journal-title":"Med. Image Anal."},{"key":"27_CR19","unstructured":"Hinton, G., Vinyals, O., Dean, J.: Distilling the knowledge in a neural network. arXiv preprint arXiv:1503.02531 (2015)"},{"key":"27_CR20","doi-asserted-by":"publisher","first-page":"151","DOI":"10.1007\/s11263-006-0031-y","volume":"75","author":"D Hoiem","year":"2007","unstructured":"Hoiem, D., Efros, A.A., Hebert, M.: Recovering surface layout from an image. Int. J. Comput. Vision 75, 151\u2013172 (2007)","journal-title":"Int. J. Comput. Vision"},{"issue":"8","key":"27_CR21","doi-asserted-by":"publisher","first-page":"2691","DOI":"10.3390\/s21082691","volume":"21","author":"SJ Hwang","year":"2021","unstructured":"Hwang, S.J., Park, S.J., Kim, G.M., Baek, J.H.: Unsupervised monocular depth estimation for colonoscope system using feedback network. Sensors 21(8), 2691 (2021)","journal-title":"Sensors"},{"issue":"3","key":"27_CR22","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1177\/2050640617700014","volume":"5","author":"MF Kaminski","year":"2017","unstructured":"Kaminski, M.F., et al.: Performance measures for lower gastrointestinal endoscopy: a European society of gastrointestinal endoscopy (ESGE) quality improvement initiative. United Eur. Gastroenterol. J. 5(3), 309\u2013334 (2017)","journal-title":"United Eur. Gastroenterol. J."},{"key":"27_CR23","series-title":"Mathematics and Visualization","doi-asserted-by":"publisher","first-page":"61","DOI":"10.1007\/978-3-540-72630-2_4","volume-title":"Visualization in Medicine and Life Sciences","author":"A Kaufman","year":"2008","unstructured":"Kaufman, A., Wang, J.: 3D surface reconstruction from endoscopic videos. In: Linsen, L., Hagen, H., Hamann, B. (eds.) Visualization in Medicine and Life Sciences. Mathematics and Visualization, pp. 61\u201374. Springer, Heidelberg (2008). https:\/\/doi.org\/10.1007\/978-3-540-72630-2_4"},{"key":"27_CR24","doi-asserted-by":"crossref","unstructured":"Ke, B., Obukhov, A., Huang, S., Metzger, N., Daudt, R.C., Schindler, K.: Repurposing diffusion-based image generators for monocular depth estimation (2023)","DOI":"10.1109\/CVPR52733.2024.00907"},{"key":"27_CR25","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"596","DOI":"10.1007\/978-3-030-01267-0_35","volume-title":"Computer Vision \u2013 ECCV 2018","author":"S Khamis","year":"2018","unstructured":"Khamis, S., Fanello, S., Rhemann, C., Kowdle, A., Valentin, J., Izadi, S.: StereoNet: guided hierarchical refinement for real-time edge-aware depth prediction. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) ECCV 2018. LNCS, vol. 11219, pp. 596\u2013613. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01267-0_35"},{"key":"27_CR26","doi-asserted-by":"crossref","unstructured":"Kim, S.Y., et al.: Layered depth refinement with mask guidance. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3855\u20133865 (2022)","DOI":"10.1109\/CVPR52688.2022.00383"},{"key":"27_CR27","unstructured":"Kingma, D.P., Ba, J.: Adam: a method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"},{"issue":"3","key":"27_CR28","doi-asserted-by":"publisher","first-page":"130","DOI":"10.1038\/nrclinonc.2013.12","volume":"10","author":"EJ Kuipers","year":"2013","unstructured":"Kuipers, E.J., R\u00f6sch, T., Bretthauer, M.: Colorectal cancer screening-optimizing current strategies and new directions. Nat. Rev. Clin. Oncol. 10(3), 130\u2013142 (2013)","journal-title":"Nat. Rev. Clin. Oncol."},{"key":"27_CR29","doi-asserted-by":"crossref","unstructured":"Kusupati, U., Cheng, S., Chen, R., Su, H.: Normal assisted stereo depth estimation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2189\u20132199 (2020)","DOI":"10.1109\/CVPR42600.2020.00226"},{"key":"27_CR30","doi-asserted-by":"crossref","unstructured":"Kwon, H., Tai, Y.W., Lin, S.: Data-driven depth map refinement via multi-scale sparse representation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 159\u2013167 (2015)","DOI":"10.1109\/CVPR.2015.7298611"},{"key":"27_CR31","doi-asserted-by":"crossref","unstructured":"Laina, I., Rupprecht, C., Belagiannis, V., Tombari, F., Navab, N.: Deeper depth prediction with fully convolutional residual networks. In: 2016 Fourth International Conference on 3D Vision (3DV), pp. 239\u2013248. IEEE (2016)","DOI":"10.1109\/3DV.2016.32"},{"key":"27_CR32","doi-asserted-by":"crossref","unstructured":"Lichy, D., Sengupta, S., Jacobs, D.W.: Fast light-weight near-field photometric stereo (2022)","DOI":"10.1109\/CVPR52688.2022.01228"},{"key":"27_CR33","doi-asserted-by":"crossref","unstructured":"Lichy, D., Wu, J., Sengupta, S., Jacobs, D.W.: Shape and material capture at home. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6123\u20136133 (2021)","DOI":"10.1109\/CVPR46437.2021.00606"},{"key":"27_CR34","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"28","DOI":"10.1007\/978-3-540-88690-7_3","volume-title":"Computer Vision \u2013 ECCV 2008","author":"C Liu","year":"2008","unstructured":"Liu, C., Yuen, J., Torralba, A., Sivic, J., Freeman, W.T.: SIFT flow: dense correspondence across different scenes. In: Forsyth, D., Torr, P., Zisserman, A. (eds.) ECCV 2008. LNCS, vol. 5304, pp. 28\u201342. Springer, Heidelberg (2008). https:\/\/doi.org\/10.1007\/978-3-540-88690-7_3"},{"issue":"5","key":"27_CR35","doi-asserted-by":"publisher","first-page":"1438","DOI":"10.1109\/TMI.2019.2950936","volume":"39","author":"X Liu","year":"2019","unstructured":"Liu, X., et al.: Dense depth estimation in monocular endoscopy with self-supervised learning methods. IEEE Trans. Med. Imaging 39(5), 1438\u20131447 (2019)","journal-title":"IEEE Trans. Med. Imaging"},{"key":"27_CR36","unstructured":"Logothetis, F., Budvytis, I., Mecca, R., Cipolla, R.: A CNN based approach for the near-field photometric stereo problem. arXiv preprint arXiv:2009.05792 (2020)"},{"key":"27_CR37","doi-asserted-by":"crossref","unstructured":"Logothetis, F., Mecca, R., Cipolla, R.: A differential volumetric approach to multi-view photometric stereo. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 1052\u20131061 (2019)","DOI":"10.1109\/ICCV.2019.00114"},{"key":"27_CR38","unstructured":"Loshchilov, I., Hutter, F.: Decoupled weight decay regularization. arXiv preprint arXiv:1711.05101 (2017)"},{"issue":"6","key":"27_CR39","doi-asserted-by":"publisher","first-page":"154","DOI":"10.1049\/htl.2019.0063","volume":"6","author":"H Luo","year":"2019","unstructured":"Luo, H., Hu, Q., Jia, F.: Details preserved unsupervised depth estimation by fusing traditional stereo knowledge from laparoscopic images. Healthc. Technol. Lett. 6(6), 154\u2013158 (2019)","journal-title":"Healthc. Technol. Lett."},{"key":"27_CR40","doi-asserted-by":"crossref","unstructured":"Ma, R., et al.: Colon10k: a benchmark for place recognition in colonoscopy. In: 2021 IEEE 18th International Symposium on Biomedical Imaging (ISBI), pp. 1279\u20131283. IEEE (2021)","DOI":"10.1109\/ISBI48211.2021.9433780"},{"key":"27_CR41","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2021.102100","volume":"72","author":"R Ma","year":"2021","unstructured":"Ma, R., et al.: RNNSLAM: reconstructing the 3D colon to visualize missing regions during a colonoscopy. Med. Image Anal. 72, 102100 (2021)","journal-title":"Med. Image Anal."},{"key":"27_CR42","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"72","DOI":"10.1007\/978-3-319-54057-3_7","volume-title":"Computer-Assisted and Robotic Endoscopy","author":"N Mahmoud","year":"2017","unstructured":"Mahmoud, N., et al.: ORBSLAM-based endoscope tracking and 3D reconstruction. In: Peters, T., et al. (eds.) CARE 2016. LNCS, vol. 10170, pp. 72\u201383. Springer, Cham (2017). https:\/\/doi.org\/10.1007\/978-3-319-54057-3_7"},{"key":"27_CR43","doi-asserted-by":"crossref","unstructured":"Nierengarten, M.B.: Colonoscopy remains the gold standard for screening despite recent tarnish: although a recent study seemed to indicate that colonoscopies are not as effective as once thought at detecting colorectal cancer, a closer look at the study clears the confusion (2023)","DOI":"10.1002\/cncr.34622"},{"key":"27_CR44","unstructured":"Oquab, M., et al.: DINOv2: learning robust visual features without supervision (2024)"},{"key":"27_CR45","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2021.102058","volume":"71","author":"KB Ozyoruk","year":"2021","unstructured":"Ozyoruk, K.B., et al.: EndoSLAM dataset and an unsupervised monocular visual odometry and depth estimation approach for endoscopic videos. Med. Image Anal. 71, 102058 (2021)","journal-title":"Med. Image Anal."},{"key":"27_CR46","doi-asserted-by":"crossref","unstructured":"Papadhimitri, T., Favaro, P.: Uncalibrated near-light photometric stereo (2014)","DOI":"10.5244\/C.28.128"},{"key":"27_CR47","unstructured":"Paszke, A., et\u00a0al.: PyTorch: an imperative style, high-performance deep learning library. Adv. Neural Inf. Process. Syst. 32 (2019)"},{"key":"27_CR48","doi-asserted-by":"crossref","unstructured":"Perez, E., Strub, F., de\u00a0Vries, H., Dumoulin, V., Courville, A.: Film: visual reasoning with a general conditioning layer (2017)","DOI":"10.1609\/aaai.v32i1.11671"},{"key":"27_CR49","doi-asserted-by":"crossref","unstructured":"Qi, X., Liao, R., Liu, Z., Urtasun, R., Jia, J.: GeoNet: geometric neural network for joint depth and surface normal estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 283\u2013291 (2018)","DOI":"10.1109\/CVPR.2018.00037"},{"key":"27_CR50","doi-asserted-by":"crossref","unstructured":"Ranftl, R., Bochkovskiy, A., Koltun, V.: Vision transformers for dense prediction. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision (ICCV), pp. 12179\u201312188, October 2021","DOI":"10.1109\/ICCV48922.2021.01196"},{"key":"27_CR51","unstructured":"Ranftl, R., Lasinger, K., Hafner, D., Schindler, K., Koltun, V.: Towards robust monocular depth estimation: mixing datasets for zero-shot cross-dataset transfer (2020)"},{"key":"27_CR52","unstructured":"Rau, A., et\u00a0al.: SimCol3D\u20133D reconstruction during colonoscopy challenge. arXiv preprint arXiv:2307.11261 (2023)"},{"issue":"4","key":"27_CR53","doi-asserted-by":"publisher","first-page":"7225","DOI":"10.1109\/LRA.2021.3095528","volume":"6","author":"D Recasens","year":"2021","unstructured":"Recasens, D., Lamarca, J., F\u00e1cil, J.M., Montiel, J., Civera, J.: Endo-depth-and-motion: reconstruction and tracking in endoscopic videos using depth networks and photometric constraints. IEEE Roboti. Autom. Lett. 6(4), 7225\u20137232 (2021)","journal-title":"IEEE Roboti. Autom. Lett."},{"key":"27_CR54","doi-asserted-by":"crossref","unstructured":"Rodriguez-Puigvert, J., et al.: LightDepth: single-view depth self-supervision from illumination decline (2023)","DOI":"10.1109\/ICCV51070.2023.01945"},{"key":"27_CR55","series-title":"LNCS","doi-asserted-by":"publisher","first-page":"130","DOI":"10.1007\/978-3-031-16437-8_13","volume-title":"MICCAI 2022","author":"J Rodriguez-Puigvert","year":"2022","unstructured":"Rodriguez-Puigvert, J., Recasens, D., Civera, J., Martinez-Cantin, R.: On the uncertain single-view depths in colonoscopies. In: Wang, L., Dou, Q., Fletcher, P.T., Speidel, S., Li, S. (eds.) MICCAI 2022. LNCS, vol. 13433, pp. 130\u2013140. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-16437-8_13"},{"key":"27_CR56","unstructured":"Romero, A., Ballas, N., Kahou, S.E., Chassang, A., Gatta, C., Bengio, Y.: FitNets: hints for thin deep nets. arXiv preprint arXiv:1412.6550 (2014)"},{"key":"27_CR57","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"234","DOI":"10.1007\/978-3-319-24574-4_28","volume-title":"Medical Image Computing and Computer-Assisted Intervention \u2013 MICCAI 2015","author":"O Ronneberger","year":"2015","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-Net: convolutional networks for biomedical image segmentation. In: Navab, N., Hornegger, J., Wells, W.M., Frangi, A.F. (eds.) MICCAI 2015. LNCS, vol. 9351, pp. 234\u2013241. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-24574-4_28"},{"key":"27_CR58","doi-asserted-by":"crossref","unstructured":"Rossi, M., Gheche, M.E., Kuhn, A., Frossard, P.: Joint graph-based depth refinement and normal estimation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12154\u201312163 (2020)","DOI":"10.1109\/CVPR42600.2020.01217"},{"key":"27_CR59","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1007\/978-3-030-58598-3_9","volume-title":"Computer Vision \u2013 ECCV 2020","author":"H Santo","year":"2020","unstructured":"Santo, H., Waechter, M., Matsushita, Y.: Deep near-light photometric stereo for\u00a0spatially varying reflectances. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12353, pp. 137\u2013152. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58598-3_9"},{"issue":"5","key":"27_CR60","doi-asserted-by":"publisher","first-page":"824","DOI":"10.1109\/TPAMI.2008.132","volume":"31","author":"A Saxena","year":"2008","unstructured":"Saxena, A., Sun, M., Ng, A.Y.: Make3D: learning 3D scene structure from a single still image. IEEE Trans. Pattern Anal. Mach. Intell. 31(5), 824\u2013840 (2008)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"27_CR61","doi-asserted-by":"crossref","unstructured":"Scarzanella, M.V., Sugiura, T., Kaneko, T., Koto, S.: Deep monocular 3D reconstruction for assisted navigation in bronchoscopy. Int. J. Comput. Assist. Radiol. Surg. 12, 1089\u20131099 (2017). https:\/\/api.semanticscholar.org\/CorpusID:26313018","DOI":"10.1007\/s11548-017-1609-2"},{"key":"27_CR62","doi-asserted-by":"crossref","unstructured":"Smith, L.N., Topin, N.: Super-convergence: very fast training of neural networks using large learning rates. In: Artificial Intelligence and Machine Learning for Multi-domain Operations Applications, vol. 11006, pp. 369\u2013386. SPIE (2019)","DOI":"10.1117\/12.2520589"},{"key":"27_CR63","unstructured":"Vaswani, A., et al.: Attention is all you need. Adv. Neural Inf. Process. Syst. 30 (2017)"},{"key":"27_CR64","doi-asserted-by":"crossref","unstructured":"Wang, S., et al.: A surface-normal based neural framework for colonoscopy reconstruction (2023)","DOI":"10.1007\/978-3-031-34048-2_61"},{"key":"27_CR65","doi-asserted-by":"crossref","unstructured":"Widya, A.R., et al.: 3D reconstruction of whole stomach from endoscope video using structure-from-motion. In: 2019 41st Annual International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC), pp. 3900\u20133904. IEEE (2019)","DOI":"10.1109\/EMBC.2019.8857964"},{"key":"27_CR66","doi-asserted-by":"crossref","unstructured":"Xu, D., Ricci, E., Ouyang, W., Wang, X., Sebe, N.: Multi-scale continuous CRFs as sequential deep networks for monocular depth estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5354\u20135362 (2017)","DOI":"10.1109\/CVPR.2017.25"},{"key":"27_CR67","doi-asserted-by":"crossref","unstructured":"Yang, L., Kang, B., Huang, Z., Xu, X., Feng, J., Zhao, H.: Depth anything: unleashing the power of large-scale unlabeled data (2024)","DOI":"10.1109\/CVPR52733.2024.00987"},{"key":"27_CR68","series-title":"LNCS","doi-asserted-by":"publisher","first-page":"266","DOI":"10.1007\/978-3-031-19769-7_16","volume-title":"ECCV 2022","author":"W Yang","year":"2022","unstructured":"Yang, W., Chen, G., Chen, C., Chen, Z., Wong, K.Y.K.: PS-NeRF: neural inverse rendering for multi-view photometric stereo. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) ECCV 2022. LNCS, vol. 13661, pp. 266\u2013284. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-19769-7_16"},{"key":"27_CR69","unstructured":"Zagoruyko, S., Komodakis, N.: Paying more attention to attention: improving the performance of convolutional neural networks via attention transfer. arXiv preprint arXiv:1612.03928 (2016)"},{"key":"27_CR70","unstructured":"Zhang, Y., Frahm, J.M., Ehrenstein, S., McGill, S.K., Rosenman, J.G., Wang, S., Pizer, S.M.: CoLDE: a depth estimation framework for colonoscopy reconstruction (2021)"},{"key":"27_CR71","doi-asserted-by":"crossref","unstructured":"Zhao, D., Lichy, D., Perrin, P.N., Frahm, J.M., Sengupta, S.: MVPSNet: fast generalizable multi-view photometric stereo. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 12525\u201312536 (2023)","DOI":"10.1109\/ICCV51070.2023.01151"},{"key":"27_CR72","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"439","DOI":"10.1007\/978-3-319-46720-7_51","volume-title":"Medical Image Computing and Computer-Assisted Intervention \u2013 MICCAI 2016","author":"Q Zhao","year":"2016","unstructured":"Zhao, Q., Price, T., Pizer, S., Niethammer, M., Alterovitz, R., Rosenman, J.: The endoscopogram: a 3D model reconstructed from endoscopic video frames. In: Ourselin, S., Joskowicz, L., Sabuncu, M.R., Unal, G., Wells, W. (eds.) MICCAI 2016. LNCS, vol. 9900, pp. 439\u2013447. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46720-7_51"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-73411-3_27","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,22]],"date-time":"2024-11-22T21:28:21Z","timestamp":1732310901000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-73411-3_27"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,23]]},"ISBN":["9783031734106","9783031734113"],"references-count":72,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-73411-3_27","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11,23]]},"assertion":[{"value":"23 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}