{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T01:41:26Z","timestamp":1773193286680,"version":"3.50.1"},"reference-count":199,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2022,11,17]],"date-time":"2022-11-17T00:00:00Z","timestamp":1668643200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,11,17]],"date-time":"2022-11-17T00:00:00Z","timestamp":1668643200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100005710","name":"Universiti Teknologi Petronas","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100005710","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2023,11]]},"DOI":"10.1007\/s00371-022-02702-z","type":"journal-article","created":{"date-parts":[[2022,11,17]],"date-time":"2022-11-17T13:03:53Z","timestamp":1668690233000},"page":"5897-5924","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["A review on monocular tracking and mapping: from model-based to data-driven methods"],"prefix":"10.1007","volume":"39","author":[{"given":"Nivesh","family":"Gadipudi","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4721-9400","authenticated-orcid":false,"given":"Irraivan","family":"Elamvazuthi","sequence":"additional","affiliation":[]},{"given":"Lila Iznita","family":"Izhar","sequence":"additional","affiliation":[]},{"given":"Lokender","family":"Tiwari","sequence":"additional","affiliation":[]},{"given":"Ramya","family":"Hebbalaguppe","sequence":"additional","affiliation":[]},{"given":"Cheng-Kai","family":"Lu","sequence":"additional","affiliation":[]},{"given":"Arockia Selvakumar Arockia","family":"Doss","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,11,17]]},"reference":[{"key":"2702_CR1","doi-asserted-by":"crossref","unstructured":"Nourani-Vatani, N., Roberts, J., Srinivasan, M.V.: Practical visual odometry for car-like vehicles. In: 2009 IEEE International Conference on Robotics and Automation, pp. 3551\u20133557 (2009). IEEE","DOI":"10.1109\/ROBOT.2009.5152403"},{"key":"2702_CR2","unstructured":"Helmick, D.M., Cheng, Y., Clouse, D.S., Matthies, L.H., Roumeliotis, S.I.: Path following using visual odometry for a mars rover in high-slip environments. In: 2004 IEEE Aerospace Conference Proceedings (IEEE Cat. No. 04TH8720), Vol. 2, pp. 772\u2013789 (2004). IEEE"},{"key":"2702_CR3","unstructured":"Woodman, O.J.: An introduction to inertial navigation. Technical report, University of Cambridge, Computer Laboratory (2007)"},{"key":"2702_CR4","doi-asserted-by":"publisher","first-page":"419","DOI":"10.1016\/j.jvcir.2017.03.015","volume":"48","author":"W Jiang","year":"2017","unstructured":"Jiang, W., Yin, Z.: Combining passive visual cameras and active imu sensors for persistent pedestrian tracking. J. Vis. Commun. Image Represent. 48, 419\u2013431 (2017). https:\/\/doi.org\/10.1016\/j.jvcir.2017.03.015","journal-title":"J. Vis. Commun. Image Represent."},{"issue":"1","key":"2702_CR5","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40064-016-3573-7","volume":"5","author":"MO Aqel","year":"2016","unstructured":"Aqel, M.O., Marhaban, M.H., Saripan, M.I., Ismail, N.B.: Review of visual odometry: types, approaches, challenges, and applications. Springerplus 5(1), 1\u201326 (2016). https:\/\/doi.org\/10.1186\/s40064-016-3573-7","journal-title":"Springerplus"},{"issue":"7","key":"2702_CR6","doi-asserted-by":"publisher","first-page":"2068","DOI":"10.3390\/s20072068","volume":"20","author":"C Debeunne","year":"2020","unstructured":"Debeunne, C., Vivet, D.: A review of visual-lidar fusion based simultaneous localization and mapping. Sensors 20(7), 2068 (2020). https:\/\/doi.org\/10.3390\/s20072068","journal-title":"Sensors"},{"key":"2702_CR7","doi-asserted-by":"crossref","unstructured":"Zaffar, M., Ehsan, S., Stolkin, R., Maier, K.M.: Sensors, slam and long-term autonomy: a review. In: 2018 NASA\/ESA Conference on Adaptive Hardware and Systems (AHS), pp. 285\u2013290 (2018). IEEE","DOI":"10.1109\/AHS.2018.8541483"},{"key":"2702_CR8","doi-asserted-by":"publisher","first-page":"289","DOI":"10.1007\/s40903-015-0032-7","volume":"1","author":"K Yousif","year":"2015","unstructured":"Yousif, K., Bab-Hadiashar, A., Hoseinnezhad, R.: An overview to visual odometry and visual slam: applications to mobile robotics. Intell. Ind. Syst. 1, 289\u2013311 (2015)","journal-title":"Intell. Ind. Syst."},{"key":"2702_CR9","doi-asserted-by":"crossref","unstructured":"Younes, G., Asmar, D.C., Shammas, E.: A survey on non-filter-based monocular visual slam systems. arXiv:1607.00470 (2016)","DOI":"10.15353\/vsnl.v2i1.109"},{"key":"2702_CR10","doi-asserted-by":"publisher","first-page":"67","DOI":"10.1016\/j.robot.2017.09.010","volume":"98","author":"G Younes","year":"2017","unstructured":"Younes, G., Asmar, D., Shammas, E., Zelek, J.: Keyframe-based monocular slam: design, survey, and future directions. Robot. Auton. Syst. 98, 67\u201388 (2017). https:\/\/doi.org\/10.1016\/j.robot.2017.09.010","journal-title":"Robot. Auton. Syst."},{"issue":"6","key":"2702_CR11","doi-asserted-by":"publisher","first-page":"1052","DOI":"10.1109\/TPAMI.2007.1049","volume":"29","author":"AJ Davison","year":"2007","unstructured":"Davison, A.J., Reid, I.D., Molton, N.D., Stasse, O.: Monoslam: real-time single camera slam. IEEE Trans. Pattern Anal. Mach. Intell. 29(6), 1052\u20131067 (2007). https:\/\/doi.org\/10.1109\/TPAMI.2007.1049","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2702_CR12","doi-asserted-by":"crossref","unstructured":"Triggs, B., McLauchlan, P.F., Hartley, R.I., Fitzgibbon, A.W.: Bundle adjustment-a modern synthesis. In: International Workshop on Vision Algorithms, pp. 298\u2013372 (1999). Springer","DOI":"10.1007\/3-540-44480-7_21"},{"key":"2702_CR13","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/3065386","volume":"60","author":"A Krizhevsky","year":"2012","unstructured":"Krizhevsky, A., Sutskever, I., Hinton, G.E.: Imagenet classification with deep convolutional neural networks. Commun. ACM 60, 84\u201390 (2012)","journal-title":"Commun. ACM"},{"issue":"2","key":"2702_CR14","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1109\/MRA.2006.1638022","volume":"13","author":"H Durrant-Whyte","year":"2006","unstructured":"Durrant-Whyte, H., Bailey, T.: Simultaneous localization and mapping: part I. IEEE Robot. Autom. Mag. 13(2), 99\u2013110 (2006). https:\/\/doi.org\/10.1109\/MRA.2006.1638022","journal-title":"IEEE Robot. Autom. Mag."},{"key":"2702_CR15","doi-asserted-by":"crossref","unstructured":"Nist\u00e9r, D., Naroditsky, O., Bergen, J.R.: Visual odometry. In; Proceedings of the 2004 IEEE Computer Society Conference on Computer Vision and Pattern Recognition, 2004. CVPR 2004. Vol. 1, (2004)","DOI":"10.1109\/CVPR.2004.1315094"},{"key":"2702_CR16","doi-asserted-by":"publisher","first-page":"486","DOI":"10.1631\/jzus.CIDE1302","volume":"14","author":"Y Wei","year":"2013","unstructured":"Wei, Y., Kang, L., Yang, B., Wu, L.: Applications of structure from motion: a survey. J. Zhejiang Univ. Sci. C 14, 486\u2013494 (2013). https:\/\/doi.org\/10.1631\/jzus.CIDE1302","journal-title":"J. Zhejiang Univ. Sci. C"},{"key":"2702_CR17","doi-asserted-by":"crossref","unstructured":"Song, S., Chandraker, M.: Robust scale estimation in real-time monocular sfm for autonomous driving. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1566\u20131573 (2014)","DOI":"10.1109\/CVPR.2014.203"},{"issue":"2","key":"2702_CR18","doi-asserted-by":"publisher","first-page":"791","DOI":"10.1109\/TITS.2019.2900330","volume":"21","author":"D Zhou","year":"2019","unstructured":"Zhou, D., Dai, Y., Li, H.: Ground-plane-based absolute scale estimation for monocular visual odometry. IEEE Trans. Intell. Transp. Syst. 21(2), 791\u2013802 (2019). https:\/\/doi.org\/10.1109\/TITS.2019.2900330","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"issue":"5","key":"2702_CR19","doi-asserted-by":"publisher","first-page":"1053","DOI":"10.1007\/s00371-019-01714-6","volume":"36","author":"M He","year":"2020","unstructured":"He, M., Zhu, C., Huang, Q., Ren, B., Liu, J.: A review of monocular visual odometry. Vis. Comput. 36(5), 1053\u20131065 (2020). https:\/\/doi.org\/10.1007\/s00371-019-01714-6","journal-title":"Vis. Comput."},{"key":"2702_CR20","doi-asserted-by":"crossref","unstructured":"Milz, S., Arbeiter, G., Witt, C., Abdallah, B., Yogamani, S.: Visual slam for automated driving: Exploring the applications of deep learning. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition Workshops, pp. 247\u2013257 (2018)","DOI":"10.1109\/CVPRW.2018.00062"},{"issue":"1","key":"2702_CR21","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11548-016-1444-x","volume":"12","author":"N Mahmoud","year":"2017","unstructured":"Mahmoud, N., Grasa, \u00d3.G., Nicolau, S.A., Doignon, C., Soler, L., Marescaux, J., Montiel, J.: On-patient see-through augmented reality based on visual slam. Int. J. Comput. Assist. Radiol. Surg. 12(1), 1\u201311 (2017)","journal-title":"Int. J. Comput. Assist. Radiol. Surg."},{"issue":"10","key":"2702_CR22","doi-asserted-by":"publisher","first-page":"2051","DOI":"10.1007\/s00371-020-01911-8","volume":"36","author":"K Yu","year":"2020","unstructured":"Yu, K., Ahn, J., Lee, J., Kim, M., Han, J.: Collaborative slam and ar-guided navigation for floor layout inspection. Vis. Comput. 36(10), 2051\u20132063 (2020)","journal-title":"Vis. Comput."},{"issue":"1","key":"2702_CR23","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s003710100122","volume":"18","author":"\u00c9 Marchand","year":"2002","unstructured":"Marchand, \u00c9., Courty, N.: Controlling a camera in a virtual environment. Vis. Comput. 18(1), 1\u201319 (2002)","journal-title":"Vis. Comput."},{"issue":"1","key":"2702_CR24","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1109\/TMI.2013.2282997","volume":"33","author":"OG Grasa","year":"2013","unstructured":"Grasa, O.G., Bernal, E., Casado, S., Gil, I., Montiel, J.: Visual slam for handheld monocular endoscope. IEEE Trans. Med. Imaging 33(1), 135\u2013146 (2013). https:\/\/doi.org\/10.1109\/TMI.2013.2282997","journal-title":"IEEE Trans. Med. Imaging"},{"issue":"5","key":"2702_CR25","doi-asserted-by":"publisher","first-page":"1438","DOI":"10.1109\/TMI.2019.2950936","volume":"39","author":"X Liu","year":"2019","unstructured":"Liu, X., Sinha, A., Ishii, M., Hager, G.D., Reiter, A., Taylor, R.H., Unberath, M.: Dense depth estimation in monocular endoscopy with self-supervised learning methods. IEEE Trans. Med. Imaging 39(5), 1438\u20131447 (2019). https:\/\/doi.org\/10.1109\/TMI.2019.2950936","journal-title":"IEEE Trans. Med. Imaging"},{"issue":"6","key":"2702_CR26","doi-asserted-by":"publisher","first-page":"580","DOI":"10.1109\/34.601246","volume":"19","author":"RI Hartley","year":"1997","unstructured":"Hartley, R.I.: In defense of the eight-point algorithm. IEEE Trans. Pattern Anal. Mach. Intell. 19(6), 580\u2013593 (1997). https:\/\/doi.org\/10.1109\/34.601246","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"2","key":"2702_CR27","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1023\/A:1007941100561","volume":"27","author":"Z Zhang","year":"1998","unstructured":"Zhang, Z.: Determining the epipolar geometry and its uncertainty: a review. Int. J. Comput. Vision 27(2), 161\u2013195 (1998). https:\/\/doi.org\/10.1023\/A:1007941100561","journal-title":"Int. J. Comput. Vision"},{"key":"2702_CR28","doi-asserted-by":"publisher","first-page":"22","DOI":"10.1016\/j.neucom.2021.09.029","volume":"467","author":"R Zhu","year":"2022","unstructured":"Zhu, R., Yang, M., Liu, W., Song, R., Yan, B., Xiao, Z.: Deepavo: Efficient pose refining with feature distilling for deep visual odometry. Neurocomputing 467, 22\u201335 (2022). https:\/\/doi.org\/10.1016\/j.neucom.2021.09.029","journal-title":"Neurocomputing"},{"issue":"3","key":"2702_CR29","doi-asserted-by":"publisher","first-page":"108","DOI":"10.1109\/MRA.2006.1678144","volume":"13","author":"T Bailey","year":"2006","unstructured":"Bailey, T., Durrant-Whyte, H.: Simultaneous localization and mapping (slam): part II. IEEE Robot. Autom. Mag. 13(3), 108\u2013117 (2006). https:\/\/doi.org\/10.1109\/MRA.2006.1678144","journal-title":"IEEE Robot. Autom. Mag."},{"issue":"4","key":"2702_CR30","doi-asserted-by":"publisher","first-page":"80","DOI":"10.1109\/MRA.2011.943233","volume":"18","author":"D Scaramuzza","year":"2011","unstructured":"Scaramuzza, D., Fraundorfer, F.: Visual odometry [tutorial]. IEEE Robot. Autom. Mag. 18(4), 80\u201392 (2011). https:\/\/doi.org\/10.1109\/MRA.2011.943233","journal-title":"IEEE Robot. Autom. Mag."},{"issue":"2","key":"2702_CR31","doi-asserted-by":"publisher","first-page":"78","DOI":"10.1109\/MRA.2012.2182810","volume":"19","author":"F Fraundorfer","year":"2012","unstructured":"Fraundorfer, F., Scaramuzza, D.: Visual odometry: part II: matching, robustness, optimization, and applications. IEEE Robot. Autom. Mag. 19(2), 78\u201390 (2012). https:\/\/doi.org\/10.1109\/MRA.2012.2182810","journal-title":"IEEE Robot. Autom. Mag."},{"key":"2702_CR32","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s41074-017-0027-2","volume":"9","author":"T Taketomi","year":"2017","unstructured":"Taketomi, T., Uchiyama, H., Ikeda, S.: Visual slam algorithms: a survey from 2010 to 2016. IPSJ Trans. Comput. Vis. Appl. 9, 1\u201311 (2017). https:\/\/doi.org\/10.1186\/s41074-017-0027-2","journal-title":"IPSJ Trans. Comput. Vis. Appl."},{"key":"2702_CR33","doi-asserted-by":"publisher","first-page":"875","DOI":"10.1007\/s12559-018-9591-8","volume":"10","author":"R Li","year":"2018","unstructured":"Li, R., Wang, S., Gu, D.: Ongoing evolution of visual slam from geometry to deep learning: challenges and opportunities. Cogn. Comput. 10, 875\u2013889 (2018). https:\/\/doi.org\/10.1007\/s12559-018-9591-8","journal-title":"Cogn. Comput."},{"key":"2702_CR34","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2020.104032","volume":"97","author":"H Taheri","year":"2021","unstructured":"Taheri, H., Xia, Z.C.: Slam; definition and evolution. Eng. Appl. Artif. Intell. 97, 104032 (2021). https:\/\/doi.org\/10.1016\/j.engappai.2020.104032","journal-title":"Eng. Appl. Artif. Intell."},{"key":"2702_CR35","doi-asserted-by":"publisher","first-page":"1309","DOI":"10.1109\/TRO.2016.2624754","volume":"32","author":"C Cadena","year":"2016","unstructured":"Cadena, C., Carlone, L., Carrillo, H., Latif, Y., Scaramuzza, D., Neira, J., Reid, I., Leonard, J.: Past, present, and future of simultaneous localization and mapping: toward the robust-perception age. IEEE Trans. Robot. 32, 1309\u20131332 (2016). https:\/\/doi.org\/10.1109\/TRO.2016.2624754","journal-title":"IEEE Trans. Robot."},{"key":"2702_CR36","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3177853","volume":"51","author":"MRU Saputra","year":"2018","unstructured":"Saputra, M.R.U., Markham, A., Trigoni, A.: Visual slam and structure from motion in dynamic environments. ACM Comput. Surv. 51, 1\u201336 (2018). https:\/\/doi.org\/10.1145\/3177853","journal-title":"ACM Comput. Surv."},{"key":"2702_CR37","doi-asserted-by":"publisher","first-page":"439","DOI":"10.1016\/j.isprsjprs.2021.11.007","volume":"183","author":"J Pan","year":"2022","unstructured":"Pan, J., Li, L., Yamaguchi, H., Hasegawa, K., Thufail, F.I., Tanaka, S., et al.: 3d reconstruction of borobudur reliefs from 2d monocular photographs based on soft-edge enhanced deep learning. ISPRS J. Photogramm. Remote. Sens. 183, 439\u2013450 (2022). https:\/\/doi.org\/10.1016\/j.isprsjprs.2021.11.007","journal-title":"ISPRS J. Photogramm. Remote. Sens."},{"key":"2702_CR38","doi-asserted-by":"crossref","unstructured":"Davison, A.J.: Real-time simultaneous localisation and mapping with a single camera. In: IEEE International Conference on Computer Vision, vol. 3, pp. 1403\u20131403 (2003). IEEE Computer Society","DOI":"10.1109\/ICCV.2003.1238654"},{"issue":"5","key":"2702_CR39","doi-asserted-by":"publisher","first-page":"1147","DOI":"10.1109\/TRO.2015.2463671","volume":"31","author":"R Mur-Artal","year":"2015","unstructured":"Mur-Artal, R., Montiel, J.M.M., Tardos, J.D.: Orb-slam: a versatile and accurate monocular slam system. IEEE Trans. Robot. 31(5), 1147\u20131163 (2015). https:\/\/doi.org\/10.1109\/TRO.2015.2463671","journal-title":"IEEE Trans. Robot."},{"issue":"6","key":"2702_CR40","doi-asserted-by":"publisher","first-page":"899","DOI":"10.1007\/s00371-018-1523-9","volume":"34","author":"Y Liu","year":"2018","unstructured":"Liu, Y., Chen, X., Gu, T., Zhang, Y., Xing, G.: Real-time camera pose estimation via line tracking. Vis. Comput. 34(6), 899\u2013909 (2018)","journal-title":"Vis. Comput."},{"key":"2702_CR41","doi-asserted-by":"crossref","unstructured":"Maity, S., Saha, A., Bhowmick, B.: Edge slam: Edge points based monocular visual slam. In: Proceedings of the IEEE International Conference on Computer Vision Workshops, pp. 2408\u20132417 (2017)","DOI":"10.1109\/ICCVW.2017.284"},{"key":"2702_CR42","unstructured":"Dong, Y., Wang, S., Yue, J., Chen, C., He, S., Wang, H., He, B.: A novel texture-less object oriented visual slam system. IEEE Trans. Intell. Transp. Syst. (2019)"},{"issue":"4","key":"2702_CR43","doi-asserted-by":"publisher","first-page":"925","DOI":"10.1109\/TRO.2019.2909168","volume":"35","author":"S Yang","year":"2019","unstructured":"Yang, S., Scherer, S.: Cubeslam: monocular 3-d object slam. IEEE Trans. Robot. 35(4), 925\u2013938 (2019). https:\/\/doi.org\/10.1109\/TRO.2019.2909168","journal-title":"IEEE Trans. Robot."},{"key":"2702_CR44","doi-asserted-by":"crossref","unstructured":"Tuytelaars, T., Mikolajczyk, K.: Local Invariant Feature Detectors: a Survey. Now Publishers Inc, (2008)","DOI":"10.1561\/9781601981394"},{"key":"2702_CR45","doi-asserted-by":"publisher","first-page":"736","DOI":"10.1016\/j.neucom.2014.08.003","volume":"149","author":"Y Li","year":"2015","unstructured":"Li, Y., Wang, S., Tian, Q., Ding, X.: A survey of recent advances in visual feature detection. Neurocomputing 149, 736\u2013751 (2015). https:\/\/doi.org\/10.1016\/j.neucom.2014.08.003","journal-title":"Neurocomputing"},{"key":"2702_CR46","doi-asserted-by":"publisher","first-page":"679","DOI":"10.1109\/TPAMI.1986.4767851","volume":"6","author":"J Canny","year":"1986","unstructured":"Canny, J.: A computational approach to edge detection. IEEE Trans. Pattern Anal. Mach. Intell. 6, 679\u2013698 (1986). https:\/\/doi.org\/10.1109\/TPAMI.1986.4767851","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2702_CR47","doi-asserted-by":"crossref","unstructured":"Harris, C.G., Stephens, M., et al.: A combined corner and edge detector. In: Alvey Vision Conference, vol. 15, pp. 10\u20135244 (1988). Citeseer","DOI":"10.5244\/C.2.23"},{"key":"2702_CR48","unstructured":"Shi, J., et al.: Good features to track. In: 1994 Proceedings of IEEE Conference on Computer Vision and Pattern Recognition, pp. 593\u2013600 (1994). IEEE"},{"issue":"5","key":"2702_CR49","doi-asserted-by":"publisher","first-page":"1094","DOI":"10.1109\/TRO.2008.2004637","volume":"24","author":"P Pini\u00e9s","year":"2008","unstructured":"Pini\u00e9s, P., Tard\u00f3s, J.D.: Large-scale slam building conditionally independent local maps: application to monocular vision. IEEE Trans. Rob. 24(5), 1094\u20131106 (2008). https:\/\/doi.org\/10.1109\/TRO.2008.2004637","journal-title":"IEEE Trans. Rob."},{"key":"2702_CR50","doi-asserted-by":"crossref","unstructured":"Kwon, J., Lee, K.M.: Monocular slam with locally planar landmarks via geometric rao-blackwellized particle filtering on lie groups. In: 2010 IEEE Computer Society Conference on Computer Vision and Pattern Recognition, pp. 1522\u20131529 (2010). IEEE","DOI":"10.1109\/CVPR.2010.5539789"},{"key":"2702_CR51","doi-asserted-by":"crossref","unstructured":"Clemente, L.A., Davison, A.J., Reid, I.D., Neira, J., Tard\u00f3s, J.D.: Mapping large loops with a single hand-held camera. In: Robotics: Science and Systems, vol. 2 (2007)","DOI":"10.15607\/RSS.2007.III.038"},{"issue":"7","key":"2702_CR52","doi-asserted-by":"publisher","first-page":"1251","DOI":"10.1109\/TPAMI.2008.189","volume":"31","author":"SA Holmes","year":"2008","unstructured":"Holmes, S.A., Klein, G., Murray, D.W.: An o (n$$^2$$) square root unscented kalman filter for visual simultaneous localization and mapping. IEEE Trans. Pattern Anal. Mach. Intell. 31(7), 1251\u20131263 (2008). https:\/\/doi.org\/10.1109\/TPAMI.2008.189","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2702_CR53","doi-asserted-by":"crossref","unstructured":"Celik, K., Chung, S.-J., Clausman, M., Somani, A.K.: Monocular vision slam for indoor aerial vehicles. In: 2009 IEEE\/RSJ International Conference on Intelligent Robots and Systems, pp. 1566\u20131573 (2009). IEEE","DOI":"10.1109\/IROS.2009.5354050"},{"key":"2702_CR54","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1016\/j.neucom.2014.05.034","volume":"145","author":"J Liu","year":"2014","unstructured":"Liu, J., Liu, D., Cheng, J., Tang, Y.: Conditional simultaneous localization and mapping: a robust visual slam system. Neurocomputing 145, 269\u2013284 (2014). https:\/\/doi.org\/10.1016\/j.neucom.2014.05.034","journal-title":"Neurocomputing"},{"issue":"2","key":"2702_CR55","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","volume":"60","author":"DG Lowe","year":"2004","unstructured":"Lowe, D.G.: Distinctive image features from scale-invariant keypoints. Int. J. Comput. Vis. 60(2), 91\u2013110 (2004). https:\/\/doi.org\/10.1023\/B:VISI.0000029664.99615.94","journal-title":"Int. J. Comput. Vis."},{"key":"2702_CR56","doi-asserted-by":"crossref","unstructured":"Rosten, E., Drummond, T.: Machine learning for high-speed corner detection. In: European Conference on Computer Vision, pp. 430\u2013443 (2006). Springer","DOI":"10.1007\/11744023_34"},{"key":"2702_CR57","doi-asserted-by":"crossref","unstructured":"Klein, G., Murray, D.: Parallel tracking and mapping for small ar workspaces. In: 2007 6th IEEE and ACM International Symposium on Mixed and Augmented Reality, pp. 225\u2013234 (2007). IEEE","DOI":"10.1109\/ISMAR.2007.4538852"},{"key":"2702_CR58","doi-asserted-by":"crossref","unstructured":"Herrera, D.C., Kim, K., Kannala, J., Pulli, K., Heikkil\u00e4, J.: Dt-slam: Deferred triangulation for robust slam. In: 2014 2nd International Conference on 3D Vision, vol. 1, pp. 609\u2013616 (2014). IEEE","DOI":"10.1109\/3DV.2014.49"},{"key":"2702_CR59","doi-asserted-by":"crossref","unstructured":"Pumarola, A., Vakhitov, A., Agudo, A., Sanfeliu, A., Moreno-Noguer, F.: Pl-slam: Real-time monocular visual slam with points and lines. In: 2017 IEEE International Conference on Robotics and Automation (ICRA), pp. 4503\u20134508 (2017). IEEE","DOI":"10.1109\/ICRA.2017.7989522"},{"issue":"1","key":"2702_CR60","doi-asserted-by":"publisher","first-page":"23","DOI":"10.1007\/s11263-020-01359-2","volume":"129","author":"J Ma","year":"2021","unstructured":"Ma, J., Jiang, X., Fan, A., Jiang, J., Yan, J.: Image matching from handcrafted to deep features: a survey. Int. J. Comput. Vis. 129(1), 23\u201379 (2021). https:\/\/doi.org\/10.1007\/s11263-020-01359-2","journal-title":"Int. J. Comput. Vis."},{"issue":"1","key":"2702_CR61","doi-asserted-by":"publisher","first-page":"58","DOI":"10.1080\/10095020.2020.1843376","volume":"24","author":"L Chen","year":"2021","unstructured":"Chen, L., Rottensteiner, F., Heipke, C.: Feature detection and description for image matching: from hand-crafted design to deep learning. Geo-Spatial Inf. Sci. 24(1), 58\u201374 (2021). https:\/\/doi.org\/10.1080\/10095020.2020.1843376","journal-title":"Geo-Spatial Inf. Sci."},{"key":"2702_CR62","doi-asserted-by":"crossref","unstructured":"Martins, P.F., Costelha, H., Bento, L.C., Neves, C.: Monocular camera calibration for autonomous driving-a comparative study. In: 2020 IEEE International Conference on Autonomous Robot Systems and Competitions (ICARSC), pp. 306\u2013311 (2020). IEEE","DOI":"10.1109\/ICARSC49921.2020.9096104"},{"issue":"6","key":"2702_CR63","doi-asserted-by":"publisher","first-page":"756","DOI":"10.1109\/TPAMI.2004.17","volume":"26","author":"D Nist\u00e9r","year":"2004","unstructured":"Nist\u00e9r, D.: An efficient solution to the five-point relative pose problem. IEEE Trans. Pattern Anal. Mach. Intell. 26(6), 756\u2013770 (2004). https:\/\/doi.org\/10.1109\/TPAMI.2004.17","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"2","key":"2702_CR64","doi-asserted-by":"publisher","first-page":"205","DOI":"10.1016\/S0262-8856(02)00154-3","volume":"21","author":"X Armangu\u00e9","year":"2003","unstructured":"Armangu\u00e9, X., Salvi, J.: Overall view regarding fundamental matrix estimation. Image Vis. Comput. 21(2), 205\u2013220 (2003). https:\/\/doi.org\/10.1016\/S0262-8856(02)00154-3","journal-title":"Image Vis. Comput."},{"issue":"2","key":"2702_CR65","doi-asserted-by":"crossref","first-page":"117","DOI":"10.1007\/s11263-006-0005-0","volume":"74","author":"V Lui","year":"2007","unstructured":"Lui, V., Drummond, T.: An iterative 5-pt algorithm for fast and robust essential matrix estimation. IJCV 74(2), 117\u2013136 (2007)","journal-title":"IJCV"},{"issue":"6","key":"2702_CR66","doi-asserted-by":"publisher","first-page":"381","DOI":"10.1145\/358669.358692","volume":"24","author":"MA Fischler","year":"1981","unstructured":"Fischler, M.A., Bolles, R.C.: Random sample consensus: a paradigm for model fitting with applications to image analysis and automated cartography. Commun. ACM 24(6), 381\u2013395 (1981). https:\/\/doi.org\/10.1145\/358669.358692","journal-title":"Commun. ACM"},{"issue":"1","key":"2702_CR67","doi-asserted-by":"publisher","first-page":"138","DOI":"10.1006\/cviu.1999.0832","volume":"78","author":"PH Torr","year":"2000","unstructured":"Torr, P.H., Zisserman, A.: Mlesac: a new robust estimator with application to estimating image geometry. Comput. Vis. Image Underst. 78(1), 138\u2013156 (2000). https:\/\/doi.org\/10.1006\/cviu.1999.0832","journal-title":"Comput. Vis. Image Underst."},{"key":"2702_CR68","doi-asserted-by":"publisher","first-page":"147523","DOI":"10.1109\/ACCESS.2019.2946387","volume":"7","author":"K Yan","year":"2019","unstructured":"Yan, K., Zhao, R., Liu, E., Ma, Y.: A robust fundamental matrix estimation method based on epipolar geometric error criterion. IEEE Access 7, 147523\u2013147533 (2019). https:\/\/doi.org\/10.1109\/ACCESS.2019.2946387","journal-title":"IEEE Access"},{"key":"2702_CR69","volume-title":"Multiple View Geometry in Computer Vision","author":"R Hartley","year":"2003","unstructured":"Hartley, R., Zisserman, A.: Multiple View Geometry in Computer Vision, 2nd edn. Cambridge University Press, New York (2003)","edition":"2"},{"key":"2702_CR70","doi-asserted-by":"crossref","unstructured":"Forster, C., Pizzoli, M., Scaramuzza, D.: Svo: Fast semi-direct monocular visual odometry. In: 2014 IEEE International Conference on Robotics and Automation (ICRA), pp. 15\u201322 (2014). IEEE","DOI":"10.1109\/ICRA.2014.6906584"},{"key":"2702_CR71","doi-asserted-by":"crossref","unstructured":"Huang, J., Liu, R., Zhang, J., Chen, S.: Fast initialization method for monocular slam based on indoor model. In: 2017 IEEE International Conference on Robotics and Biomimetics (ROBIO), pp. 2360\u20132365 (2017). IEEE","DOI":"10.1109\/ROBIO.2017.8324772"},{"key":"2702_CR72","doi-asserted-by":"publisher","first-page":"8176489","DOI":"10.1155\/2019\/8176489","volume":"2019","author":"Y Yang","year":"2019","unstructured":"Yang, Y., Xiong, J., She, X., Liu, C., Yang, C., Li, J.: Passive initialization method based on motion characteristics for monocular slam. Complexity 2019, 8176489\u20131817648911 (2019). https:\/\/doi.org\/10.1155\/2019\/8176489","journal-title":"Complexity"},{"key":"2702_CR73","doi-asserted-by":"crossref","unstructured":"Strasdat, H., Montiel, J., Davison, A.J.: Real-time monocular slam: Why filter? In: 2010 IEEE International Conference on Robotics and Automation, pp. 2657\u20132664 (2010). IEEE","DOI":"10.1109\/ROBOT.2010.5509636"},{"key":"2702_CR74","doi-asserted-by":"crossref","unstructured":"Ho, T.S., Fai, Y.C., Ming, E.S.L.: Simultaneous localization and mapping survey based on filtering techniques. In: 2015 10th Asian Control Conference (ASCC), pp. 1\u20136 (2015). IEEE","DOI":"10.1109\/ASCC.2015.7244836"},{"issue":"5","key":"2702_CR75","doi-asserted-by":"publisher","first-page":"1036","DOI":"10.1109\/TRO.2007.903811","volume":"23","author":"S Huang","year":"2007","unstructured":"Huang, S., Dissanayake, G.: Convergence and consistency analysis for extended Kalman filter based slam. IEEE Trans. Robot. 23(5), 1036\u20131049 (2007). https:\/\/doi.org\/10.1109\/TRO.2007.903811","journal-title":"IEEE Trans. Robot."},{"issue":"3","key":"2702_CR76","doi-asserted-by":"publisher","first-page":"242","DOI":"10.1109\/70.938382","volume":"17","author":"JE Guivant","year":"2001","unstructured":"Guivant, J.E., Nebot, E.M.: Optimization of the simultaneous localization and map-building algorithm for real-time implementation. IEEE Trans. Robot. Autom. 17(3), 242\u2013257 (2001). https:\/\/doi.org\/10.1109\/70.938382","journal-title":"IEEE Trans. Robot. Autom."},{"issue":"3","key":"2702_CR77","doi-asserted-by":"publisher","first-page":"267","DOI":"10.1023\/A:1015217631658","volume":"12","author":"G Dissanayake","year":"2002","unstructured":"Dissanayake, G., Williams, S.B., Durrant-Whyte, H., Bailey, T.: Map management for efficient simultaneous localization and mapping (slam). Auton. Robot. 12(3), 267\u2013286 (2002). https:\/\/doi.org\/10.1023\/A:1015217631658","journal-title":"Auton. Robot."},{"issue":"5","key":"2702_CR78","doi-asserted-by":"publisher","first-page":"946","DOI":"10.1109\/TRO.2008.2004637","volume":"24","author":"LM Paz","year":"2008","unstructured":"Paz, L.M., Pini\u00e9s, P., Tard\u00f3s, J.D., Neira, J.: Large-scale 6-dof slam with stereo-in-hand. IEEE Trans. Robot. 24(5), 946\u2013957 (2008)","journal-title":"IEEE Trans. Robot."},{"issue":"5","key":"2702_CR79","doi-asserted-by":"publisher","first-page":"1002","DOI":"10.1109\/TRO.2008.2004888","volume":"24","author":"I Mahon","year":"2008","unstructured":"Mahon, I., Williams, S.B., Pizarro, O., Johnson-Roberson, M.: Efficient view-based slam using visual loop closures. IEEE Trans. Robot. 24(5), 1002\u20131014 (2008). https:\/\/doi.org\/10.1109\/TRO.2008.2004888","journal-title":"IEEE Trans. Robot."},{"issue":"11","key":"2702_CR80","doi-asserted-by":"publisher","first-page":"1207","DOI":"10.1016\/j.robot.2010.08.003","volume":"58","author":"C Cadena","year":"2010","unstructured":"Cadena, C., Neira, J.: Slam in o (logn) with the combined Kalman-information filter. Robot. Auton. Syst. 58(11), 1207\u20131219 (2010). https:\/\/doi.org\/10.1016\/j.robot.2010.08.003","journal-title":"Robot. Auton. Syst."},{"issue":"8","key":"2702_CR81","doi-asserted-by":"publisher","first-page":"19852","DOI":"10.3390\/s150819852","volume":"15","author":"B He","year":"2015","unstructured":"He, B., Liu, Y., Dong, D., Shen, Y., Yan, T., Nian, R.: Simultaneous localization and mapping with iterative sparse extended information filter for autonomous vehicles. Sensors 15(8), 19852\u201319879 (2015). https:\/\/doi.org\/10.3390\/s150819852","journal-title":"Sensors"},{"key":"2702_CR82","unstructured":"Wan, E.A., Van Der\u00a0Merwe, R.: The unscented Kalman filter for nonlinear estimation. In: Proceedings of the IEEE 2000 Adaptive Systems for Signal Processing, Communications, and Control Symposium (Cat. No. 00EX373), pp. 153\u2013158 (2000). IEEE"},{"issue":"5","key":"2702_CR83","doi-asserted-by":"publisher","first-page":"932","DOI":"10.1109\/TRO.2008.2003276","volume":"24","author":"J Civera","year":"2008","unstructured":"Civera, J., Davison, A.J., Montiel, J.M.: Inverse depth parametrization for monocular slam. IEEE Trans. Robot. 24(5), 932\u2013945 (2008). https:\/\/doi.org\/10.1109\/TRO.2008.2003276","journal-title":"IEEE Trans. Robot."},{"key":"2702_CR84","unstructured":"Montemerlo, M., Thrun, S., Koller, D., Wegbreit, B., et al.: Fastslam: A factored solution to the simultaneous localization and mapping problem. Aaai\/iaai Vol. 593598 (2002)"},{"key":"2702_CR85","unstructured":"Montemerlo, M., Thrun, S., Koller, D., Wegbreit, B., et al.: Fastslam 2.0: An improved particle filtering algorithm for simultaneous localization and mapping that provably converges. In: IJCAI, vol. 3, pp. 1151\u20131156 (2003)"},{"key":"2702_CR86","doi-asserted-by":"crossref","unstructured":"Pupilli, M., Calway, A.: Real-time camera tracking using a particle filter. In: BMVC (2005)","DOI":"10.5244\/C.19.50"},{"issue":"11","key":"2702_CR87","doi-asserted-by":"publisher","first-page":"305","DOI":"10.3390\/electronics7110305","volume":"7","author":"SA Hoseini","year":"2018","unstructured":"Hoseini, S.A., Kabiri, P.: A novel feature-based approach for indoor monocular slam. Electronics 7(11), 305 (2018). https:\/\/doi.org\/10.3390\/electronics7110305","journal-title":"Electronics"},{"key":"2702_CR88","doi-asserted-by":"crossref","unstructured":"Angeli, A., Doncieux, S., Meyer, J.-A., Filliat, D.: Real-time visual loop-closure detection. In: 2008 IEEE International Conference on Robotics and Automation, pp. 1842\u20131847 (2008). IEEE","DOI":"10.1109\/ROBOT.2008.4543475"},{"issue":"1","key":"2702_CR89","doi-asserted-by":"publisher","DOI":"10.1117\/1.JEI.23.1.013029","volume":"23","author":"S-H Lee","year":"2014","unstructured":"Lee, S.-H.: Real-time camera tracking using a particle filter combined with unscented kalman filters. J. Electron. Imaging 23(1), 013029 (2014). https:\/\/doi.org\/10.1117\/1.JEI.23.1.013029","journal-title":"J. Electron. Imaging"},{"issue":"4","key":"2702_CR90","doi-asserted-by":"publisher","first-page":"1364","DOI":"10.1109\/TVT.2015.2388780","volume":"64","author":"H Zhou","year":"2015","unstructured":"Zhou, H., Zou, D., Pei, L., Ying, R., Liu, P., Yu, W.: Structslam: Visual slam with building structure lines. IEEE Trans. Veh. Technol. 64(4), 1364\u20131375 (2015). https:\/\/doi.org\/10.1109\/TVT.2015.2388780","journal-title":"IEEE Trans. Veh. Technol."},{"issue":"8","key":"2702_CR91","doi-asserted-by":"publisher","first-page":"1162","DOI":"10.1080\/17517575.2019.1698772","volume":"15","author":"K-K Tseng","year":"2021","unstructured":"Tseng, K.-K., Li, J., Chang, Y., Yung, K., Chan, C., Hsu, C.-Y.: A new architecture for simultaneous localization and mapping: an application of a planetary rover. Enterprise Inf. Syst. 15(8), 1162\u20131178 (2021). https:\/\/doi.org\/10.1080\/17517575.2019.1698772","journal-title":"Enterprise Inf. Syst."},{"issue":"8","key":"2702_CR92","doi-asserted-by":"publisher","first-page":"930","DOI":"10.1109\/TPAMI.2003.1217599","volume":"25","author":"X-S Gao","year":"2003","unstructured":"Gao, X.-S., Hou, X.-R., Tang, J., Cheng, H.-F.: Complete solution classification for the perspective-three-point problem. IEEE Trans. Pattern Anal. Mach. Intell. 25(8), 930\u2013943 (2003). https:\/\/doi.org\/10.1109\/TPAMI.2003.1217599","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"2","key":"2702_CR93","doi-asserted-by":"publisher","first-page":"155","DOI":"10.1007\/s11263-008-0152-6","volume":"81","author":"V Lepetit","year":"2009","unstructured":"Lepetit, V., Moreno-Noguer, F., Fua, P.: Epnp: an accurate o (n) solution to the pnp problem. Int. J. Comput. Vis. 81(2), 155 (2009). https:\/\/doi.org\/10.1007\/s11263-008-0152-6","journal-title":"Int. J. Comput. Vis."},{"key":"2702_CR94","doi-asserted-by":"crossref","unstructured":"Persson, M., Nordberg, K.: Lambda twist: An accurate fast robust perspective three point (p3p) solver. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 318\u2013332 (2018)","DOI":"10.1007\/978-3-030-01225-0_20"},{"key":"2702_CR95","doi-asserted-by":"crossref","unstructured":"Blochliger, F., Fehr, M., Dymczyk, M., Schneider, T., Siegwart, R.: Topomap: Topological mapping and navigation based on visual slam maps. In: 2018 IEEE International Conference on Robotics and Automation (ICRA), pp. 3818\u20133825 (2018). IEEE","DOI":"10.1109\/ICRA.2018.8460641"},{"key":"2702_CR96","doi-asserted-by":"crossref","unstructured":"Yang, A., Luo, Y., Chen, L., Xu, Y.: Survey of 3d map in slam: localization and navigation. In: Advanced Computational Methods in Life System Modeling and Simulation, pp. 410\u2013420. Springer (2017)","DOI":"10.1007\/978-981-10-6370-1_41"},{"key":"2702_CR97","unstructured":"Cai, Q., Zhang, L., Wu, Y., Yu, W., Hu, D.: A pose-only solution to visual reconstruction and navigation. arXiv preprint arXiv:2103.01530 (2021)"},{"key":"2702_CR98","doi-asserted-by":"crossref","unstructured":"Newcombe, R.A., Lovegrove, S.J., Davison, A.J.: Dtam: Dense tracking and mapping in real-time. In: 2011 International Conference on Computer Vision, pp. 2320\u20132327 (2011). IEEE","DOI":"10.1109\/ICCV.2011.6126513"},{"key":"2702_CR99","doi-asserted-by":"crossref","unstructured":"Engel, J., Sch\u00f6ps, T., Cremers, D.: Lsd-slam: Large-scale direct monocular slam. In: European Conference on Computer Vision, pp. 834\u2013849 (2014). Springer","DOI":"10.1007\/978-3-319-10605-2_54"},{"issue":"2","key":"2702_CR100","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1109\/TRO.2016.2623335","volume":"33","author":"C Forster","year":"2016","unstructured":"Forster, C., Zhang, Z., Gassner, M., Werlberger, M., Scaramuzza, D.: Svo: Semidirect visual odometry for monocular and multicamera systems. IEEE Trans. Rob. 33(2), 249\u2013265 (2016). https:\/\/doi.org\/10.1109\/TRO.2016.2623335","journal-title":"IEEE Trans. Rob."},{"key":"2702_CR101","doi-asserted-by":"crossref","unstructured":"Concha, A., Civera, J.: Dpptam: Dense piecewise planar tracking and mapping from a monocular sequence. In: 2015 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), pp. 5686\u20135693 (2015). IEEE","DOI":"10.1109\/IROS.2015.7354184"},{"issue":"3","key":"2702_CR102","doi-asserted-by":"publisher","first-page":"611","DOI":"10.1109\/TPAMI.2017.2658577","volume":"40","author":"J Engel","year":"2017","unstructured":"Engel, J., Koltun, V., Cremers, D.: Direct sparse odometry. IEEE Trans. Pattern Anal. Mach. Intell. 40(3), 611\u2013625 (2017). https:\/\/doi.org\/10.1109\/TPAMI.2017.2658577","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"4","key":"2702_CR103","doi-asserted-by":"publisher","first-page":"1363","DOI":"10.1109\/TRO.2020.2991614","volume":"36","author":"J Zubizarreta","year":"2020","unstructured":"Zubizarreta, J., Aguinaga, I., Montiel, J.M.M.: Direct sparse mapping. IEEE Trans. Robot. 36(4), 1363\u20131370 (2020). https:\/\/doi.org\/10.1109\/TRO.2020.2991614","journal-title":"IEEE Trans. Robot."},{"key":"2702_CR104","doi-asserted-by":"crossref","unstructured":"Roberts, R., Nguyen, H., Krishnamurthi, N., Balch, T.: Memory-based learning for visual odometry. In: 2008 IEEE International Conference on Robotics and Automation, pp. 47\u201352 (2008). IEEE","DOI":"10.1109\/ROBOT.2008.4543185"},{"issue":"5","key":"2702_CR105","doi-asserted-by":"publisher","first-page":"526","DOI":"10.1177\/2F0278364912472245","volume":"32","author":"V Guizilini","year":"2013","unstructured":"Guizilini, V., Ramos, F.: Semi-parametric learning for visual odometry. Tnt. J. Robot. Res. 32(5), 526\u2013546 (2013). https:\/\/doi.org\/10.1177\/2F0278364912472245","journal-title":"Tnt. J. Robot. Res."},{"key":"2702_CR106","doi-asserted-by":"crossref","unstructured":"Konda, K.R., Memisevic, R.: Learning visual odometry with a convolutional network. In: VISAPP (1), pp. 486\u2013490 (2015)","DOI":"10.5220\/0005299304860490"},{"key":"2702_CR107","unstructured":"DeTone, D., Malisiewicz, T., Rabinovich, A.: Deep image homography estimation. arXiv preprint arXiv:1606.03798 (2016)"},{"issue":"1","key":"2702_CR108","doi-asserted-by":"publisher","first-page":"18","DOI":"10.1109\/TITS.2019.2952159","volume":"1","author":"G Costante","year":"2015","unstructured":"Costante, G., Mancini, M., Valigi, P., Ciarfuglia, T.A.: Exploring representation learning with cnns for frame-to-frame ego-motion estimation. IEEE Robot. Autom. Lett. 1(1), 18\u201325 (2015). https:\/\/doi.org\/10.1109\/TITS.2019.2952159","journal-title":"IEEE Robot. Autom. Lett."},{"key":"2702_CR109","doi-asserted-by":"crossref","unstructured":"Muller, P., Savakis, A.: Flowdometry: An optical flow and deep learning based approach to visual odometry. In: 2017 IEEE Winter Conference on Applications of Computer Vision (WACV), pp. 624\u2013631 (2017). IEEE","DOI":"10.1109\/WACV.2017.75"},{"key":"2702_CR110","doi-asserted-by":"crossref","unstructured":"Dosovitskiy, A., Fischer, P., Ilg, E., Hausser, P., Hazirbas, C., Golkov, V., Van Der\u00a0Smagt, P., Cremers, D., Brox, T.: Flownet: Learning optical flow with convolutional networks. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2758\u20132766 (2015)","DOI":"10.1109\/ICCV.2015.316"},{"key":"2702_CR111","doi-asserted-by":"crossref","unstructured":"Ummenhofer, B., Zhou, H., Uhrig, J., Mayer, N., Ilg, E., Dosovitskiy, A., Brox, T.: Demon: Depth and motion network for learning monocular stereo. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5038\u20135047 (2017)","DOI":"10.1109\/CVPR.2017.596"},{"issue":"3","key":"2702_CR112","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1109\/LRA.2018.2803211","volume":"3","author":"G Costante","year":"2018","unstructured":"Costante, G., Ciarfuglia, T.A.: Ls-vo: Learning dense optical subspace for robust visual odometry estimation. IEEE Robot. Autom. Lett. 3(3), 1735\u20131742 (2018). https:\/\/doi.org\/10.1109\/LRA.2018.2803211","journal-title":"IEEE Robot. Autom. Lett."},{"issue":"4","key":"2702_CR113","doi-asserted-by":"publisher","first-page":"1313","DOI":"10.3390\/s21041313","volume":"21","author":"T Pandey","year":"2021","unstructured":"Pandey, T., Pena, D., Byrne, J., Moloney, D.: Leveraging deep learning for visual odometry using optical flow. Sensors 21(4), 1313 (2021). https:\/\/doi.org\/10.3390\/s21041313","journal-title":"Sensors"},{"key":"2702_CR114","doi-asserted-by":"publisher","unstructured":"Wang, H., Ban, X., Ding, F., Xiao, Y., Zhou, J.: Monocular vo based on deep siamese convolutional neural network. Complexity (2020). https:\/\/doi.org\/10.1155\/2020\/6367273","DOI":"10.1155\/2020\/6367273"},{"key":"2702_CR115","doi-asserted-by":"crossref","unstructured":"Saputra, M.R.U., de Gusmao, P.P., Wang, S., Markham, A., Trigoni, N.: Learning monocular visual odometry through geometry-aware curriculum learning. In: 2019 International Conference on Robotics and Automation (ICRA), pp. 3549\u20133555 (2019). IEEE","DOI":"10.1109\/ICRA.2019.8793581"},{"issue":"4\u20135","key":"2702_CR116","doi-asserted-by":"publisher","first-page":"513","DOI":"10.1177\/2F0278364917734298","volume":"37","author":"S Wang","year":"2018","unstructured":"Wang, S., Clark, R., Wen, H., Trigoni, N.: End-to-end, sequence-to-sequence probabilistic visual odometry through deep neural networks. Int. J. Robot. Res. 37(4\u20135), 513\u2013542 (2018). https:\/\/doi.org\/10.1177\/2F0278364917734298","journal-title":"Int. J. Robot. Res."},{"key":"2702_CR117","doi-asserted-by":"crossref","unstructured":"Kendall, A., Cipolla, R.: Geometric loss functions for camera pose regression with deep learning. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5974\u20135983 (2017)","DOI":"10.1109\/CVPR.2017.694"},{"issue":"23","key":"2702_CR118","doi-asserted-by":"publisher","first-page":"8155","DOI":"10.3390\/s21238155","volume":"21","author":"N Gadipudi","year":"2021","unstructured":"Gadipudi, N., Elamvazuthi, I., Lu, C.-K., Paramasivam, S., Su, S.: Wpo-net: Windowed pose optimization network for monocular visual odometry estimation. Sensors 21(23), 8155 (2021). https:\/\/doi.org\/10.3390\/s21238155","journal-title":"Sensors"},{"key":"2702_CR119","doi-asserted-by":"publisher","first-page":"175220","DOI":"10.1109\/ACCESS.2020.3025557","volume":"8","author":"X Wang","year":"2020","unstructured":"Wang, X., Zhang, H.: Deep monocular visual odometry for ground vehicle. IEEE Access 8, 175220\u2013175229 (2020). https:\/\/doi.org\/10.1109\/ACCESS.2020.3025557","journal-title":"IEEE Access"},{"key":"2702_CR120","doi-asserted-by":"crossref","unstructured":"Saputra, M.R.U., de Gusmao, P.P., Almalioglu, Y., Markham, A., Trigoni, N.: Distilling knowledge from a deep pose regressor network. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 263\u2013272 (2019)","DOI":"10.1109\/ICCV.2019.00035"},{"key":"2702_CR121","doi-asserted-by":"crossref","unstructured":"Koumis, A.S., Preiss, J.A., Sukhatme, G.S.: Estimating metric scale visual odometry from videos using 3d convolutional networks. In: 2019 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), pp. 265\u2013272 (2019). IEEE","DOI":"10.1109\/IROS40897.2019.8967919"},{"key":"2702_CR122","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2019.107187","volume":"102","author":"G Zhai","year":"2020","unstructured":"Zhai, G., Liu, L., Zhang, L., Liu, Y., Jiang, Y.: Poseconvgru: a monocular approach for visual ego-motion estimation by learning. Pattern Recogn. 102, 107187 (2020). https:\/\/doi.org\/10.1016\/j.patcog.2019.107187","journal-title":"Pattern Recogn."},{"key":"2702_CR123","doi-asserted-by":"crossref","unstructured":"Kuo, X.-Y., Liu, C., Lin, K.-C., Lee, C.-Y.: Dynamic attention-based visual odometry. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, pp. 36\u201337 (2020)","DOI":"10.1109\/CVPRW50498.2020.00026"},{"key":"2702_CR124","doi-asserted-by":"publisher","unstructured":"Gadipudi, N., Elamvazuthi, I., Lu, C.-K., Paramasivam, S., Su, S.: Lightweight spatial attentive network for vehicular visual odometry estimation in urban environments. Neural Computing and Applications, 1\u201314 (2022). https:\/\/doi.org\/10.1007\/s00521-022-07484-y","DOI":"10.1007\/s00521-022-07484-y"},{"key":"2702_CR125","doi-asserted-by":"crossref","unstructured":"Xue, F., Wang, X., Li, S., Wang, Q., Wang, J., Zha, H.: Beyond tracking: Selecting memory and refining poses for deep visual odometry. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8575\u20138583 (2019)","DOI":"10.1109\/CVPR.2019.00877"},{"key":"2702_CR126","doi-asserted-by":"crossref","unstructured":"Xu, S., Xiong, H., Wu, Q., Wang, Z.: Attention-based long-term modeling for deep visual odometry. In: 2021 Digital Image Computing: Techniques and Applications (DICTA), pp. 1\u20138. IEEE","DOI":"10.1109\/DICTA52665.2021.9647140"},{"key":"2702_CR127","doi-asserted-by":"crossref","unstructured":"Mayer, N., Ilg, E., Hausser, P., Fischer, P., Cremers, D., Dosovitskiy, A., Brox, T.: A large dataset to train convolutional networks for disparity, optical flow, and scene flow estimation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4040\u20134048 (2016)","DOI":"10.1109\/CVPR.2016.438"},{"key":"2702_CR128","doi-asserted-by":"crossref","unstructured":"Garg, R., Bg, V.K., Carneiro, G., Reid, I.: Unsupervised cnn for single view depth estimation: geometry to the rescue. In: European Conference on Computer Vision, pp. 740\u2013756 (2016). Springer","DOI":"10.1007\/978-3-319-46484-8_45"},{"key":"2702_CR129","doi-asserted-by":"crossref","unstructured":"Kendall, A., Grimes, M., Cipolla, R.: Posenet: A convolutional network for real-time 6-dof camera relocalization. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2938\u20132946 (2015)","DOI":"10.1109\/ICCV.2015.336"},{"key":"2702_CR130","unstructured":"Jaderberg, M., Simonyan, K., Zisserman, A., Kavukcuoglu, K.: Spatial transformer networks. arXiv preprint arXiv:1506.02025 (2015)"},{"key":"2702_CR131","doi-asserted-by":"crossref","unstructured":"Zhou, T., Brown, M., Snavely, N., Lowe, D.G.: Unsupervised learning of depth and ego-motion from video. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1851\u20131858 (2017)","DOI":"10.1109\/CVPR.2017.700"},{"key":"2702_CR132","doi-asserted-by":"crossref","unstructured":"Prasad, V., Bhowmick, B.: Sfmlearner++: Learning monocular depth and ego-motion using meaningful geometric constraints. In: 2019 IEEE Winter Conference on Applications of Computer Vision (WACV), pp. 2087\u20132096 (2019). IEEE","DOI":"10.1109\/WACV.2019.00226"},{"key":"2702_CR133","doi-asserted-by":"crossref","unstructured":"Yin, Z., Shi, J.: Geonet: Unsupervised learning of dense depth, optical flow and camera pose. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1983\u20131992 (2018)","DOI":"10.1109\/CVPR.2018.00212"},{"key":"2702_CR134","doi-asserted-by":"crossref","unstructured":"Zou, Y., Luo, Z., Huang, J.-B.: Df-net: Unsupervised joint learning of depth and flow using cross-task consistency. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 36\u201353 (2018)","DOI":"10.1007\/978-3-030-01228-1_3"},{"issue":"12","key":"2702_CR135","doi-asserted-by":"publisher","DOI":"10.1063\/1.5120605","volume":"29","author":"Q Sun","year":"2019","unstructured":"Sun, Q., Tang, Y., Zhao, C.: Cycle-sfm: Joint self-supervised learning of depth and camera motion from monocular image sequences. Chaos: Interdiscip. J. Nonlinear Sci. 29(12), 123102 (2019). https:\/\/doi.org\/10.1063\/1.5120605","journal-title":"Chaos: Interdiscip. J. Nonlinear Sci."},{"key":"2702_CR136","unstructured":"Goodfellow, I.J., Pouget-Abadie, J., Mirza, M., Xu, B., Warde-Farley, D., Ozair, S., Courville, A., Bengio, Y.: Generative adversarial networks. arXiv preprint arXiv:1406.2661 (2014)"},{"key":"2702_CR137","doi-asserted-by":"crossref","unstructured":"Almalioglu, Y., Saputra, M.R.U., de Gusmao, P.P., Markham, A., Trigoni, N.: Ganvo: Unsupervised deep monocular visual odometry and depth estimation with generative adversarial networks. In: 2019 International Conference on Robotics and Automation (ICRA), pp. 5474\u20135480 (2019). IEEE","DOI":"10.1109\/ICRA.2019.8793512"},{"key":"2702_CR138","doi-asserted-by":"crossref","unstructured":"Li, S., Xue, F., Wang, X., Yan, Z., Zha, H.: Sequential adversarial learning for self-supervised deep visual odometry. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 2851\u20132860 (2019)","DOI":"10.1109\/ICCV.2019.00294"},{"key":"2702_CR139","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2020.3044181","author":"C Zhao","year":"2020","unstructured":"Zhao, C., Yen, G.G., Sun, Q., Zhang, C., Tang, Y.: Masked gan for unsupervised depth and pose prediction with scale consistency. IEEE Trans. Neural Netw. Learn. Syst. (2020). https:\/\/doi.org\/10.1109\/TNNLS.2020.3044181","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"2702_CR140","unstructured":"Bian, J.-W., Li, Z., Wang, N., Zhan, H., Shen, C., Cheng, M.-M., Reid, I.: Unsupervised scale-consistent depth and ego-motion learning from monocular video. arXiv preprint arXiv:1908.10553 (2019)"},{"key":"2702_CR141","doi-asserted-by":"crossref","unstructured":"Zou, Y., Ji, P., Tran, Q.-H., Huang, J.-B., Chandraker, M.: Learning monocular visual odometry via self-supervised long-term modeling. In: Proceedings of 16th European Conference Computer Vision\u2013ECCV 2020, Glasgow, UK, August 23\u201328, 2020, Part XIV 16, pp. 710\u2013727 (2020). Springer","DOI":"10.1007\/978-3-030-58568-6_42"},{"key":"2702_CR142","doi-asserted-by":"crossref","unstructured":"Lu, Y., Xu, X., Ding, M., Lu, Z., Xiang, T.: A global occlusion-aware approach to self-supervised monocular visual odometry. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 35, pp. 2260\u20132268 (2021)","DOI":"10.1609\/aaai.v35i3.16325"},{"key":"2702_CR143","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2021.3053412","author":"Y Liu","year":"2021","unstructured":"Liu, Y., Wang, H., Wang, J., Wang, X.: Unsupervised monocular visual odometry based on confidence evaluation. IEEE Trans. Intell. Transp. Syst. (2021). https:\/\/doi.org\/10.1109\/TITS.2021.3053412","journal-title":"IEEE Trans. Intell. Transp. Syst."},{"key":"2702_CR144","doi-asserted-by":"crossref","unstructured":"Sarlin, P.-E., Unagar, A., Larsson, M., Germain, H., Toft, C., Larsson, V., Pollefeys, M., Lepetit, V., Hammarstrand, L., Kahl, F., et al.: Back to the feature: Learning robust camera localization from pixels to pose. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3247\u20133257 (2021)","DOI":"10.1109\/CVPR46437.2021.00326"},{"issue":"3","key":"2702_CR145","doi-asserted-by":"publisher","first-page":"615","DOI":"10.1007\/s13042-019-01020-6","volume":"11","author":"J Zhang","year":"2020","unstructured":"Zhang, J., Su, Q., Liu, P., Xu, C., Chen, Y.: Unsupervised learning of monocular depth and ego-motion with space-temporal-centroid loss. Int. J. Mach. Learn. Cybern. 11(3), 615\u2013627 (2020). https:\/\/doi.org\/10.1007\/s13042-019-01020-6","journal-title":"Int. J. Mach. Learn. Cybern."},{"key":"2702_CR146","doi-asserted-by":"publisher","first-page":"18076","DOI":"10.1109\/ACCESS.2019.2896988","volume":"7","author":"Q Liu","year":"2019","unstructured":"Liu, Q., Li, R., Hu, H., Gu, D.: Using unsupervised deep learning technique for monocular visual odometry. Ieee Access 7, 18076\u201318088 (2019). https:\/\/doi.org\/10.1109\/ACCESS.2019.2896988","journal-title":"Ieee Access"},{"key":"2702_CR147","doi-asserted-by":"publisher","first-page":"4130","DOI":"10.1109\/TIP.2020.2968751","volume":"29","author":"A Wang","year":"2020","unstructured":"Wang, A., Fang, Z., Gao, Y., Tan, S., Wang, S., Ma, S., Hwang, J.-N.: Adversarial learning for joint optimization of depth and ego-motion. IEEE Trans. Image Process. 29, 4130\u20134142 (2020). https:\/\/doi.org\/10.1109\/TIP.2020.2968751","journal-title":"IEEE Trans. Image Process."},{"key":"2702_CR148","doi-asserted-by":"crossref","unstructured":"Ding, Y., Barath, D., Yang, J., Kukelova, Z.: Relative pose from a calibrated and an uncalibrated smartphone image. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12766\u201312775 (2022)","DOI":"10.1109\/CVPR52688.2022.01243"},{"key":"2702_CR149","unstructured":"Paszke, A., Gross, S., Massa, F., Lerer, A., Bradbury, J., Chanan, G., Killeen, T., Lin, Z., Gimelshein, N., Antiga, L., Desmaison, A., K\u00f6pf, A., Yang, E., DeVito, Z., Raison, M., Tejani, A., Chilamkurthy, S., Steiner, B., Fang, L., Bai, J., Chintala, S.: Pytorch: An imperative style, high-performance deep learning library. In: NeurIPS (2019)"},{"key":"2702_CR150","unstructured":"Abadi, M., Barham, P., Chen, J., Chen, Z., Davis, A., Dean, J., Devin, M., Ghemawat, S., Irving, G., Isard, M., Kudlur, M., Levenberg, J., Monga, R., Moore, S., Murray, D., Steiner, B., Tucker, P., Vasudevan, V., Warden, P., Wicke, M., Yu, Y., Zhang, X.: Tensorflow: A system for large-scale machine learning. In: OSDI (2016)"},{"key":"2702_CR151","unstructured":"Chen, T., Li, M., Li, Y., Lin, M., Wang, N., Wang, M., Xiao, T., Xu, B., Zhang, C., Zhang, Z.: Mxnet: A flexible and efficient machine learning library for heterogeneous distributed systems. arXiv:1512.01274 (2015)"},{"key":"2702_CR152","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2020.07.025","author":"C Tian","year":"2020","unstructured":"Tian, C., Fei, L., Zheng, W., Xu, Y., Zuo, W., Lin, C.-W.: Deep learning on image denoising: an overview. Neural Netw. (2020). https:\/\/doi.org\/10.1016\/j.neunet.2020.07.025","journal-title":"Neural Netw."},{"key":"2702_CR153","doi-asserted-by":"crossref","unstructured":"Tao, X., Gao, H., Wang, Y., Shen, X., Wang, J., Jia, J.: Scale-recurrent network for deep image deblurring. 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 8174\u20138182 (2018)","DOI":"10.1109\/CVPR.2018.00853"},{"key":"2702_CR154","doi-asserted-by":"publisher","first-page":"295","DOI":"10.1109\/TPAMI.2015.2439281","volume":"38","author":"C Dong","year":"2016","unstructured":"Dong, C., Loy, C.C., He, K., Tang, X.: Image super-resolution using deep convolutional networks. IEEE Trans. Pattern Anal. Mach. Intell. 38, 295\u2013307 (2016). https:\/\/doi.org\/10.1109\/TPAMI.2015.2439281","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"2702_CR155","doi-asserted-by":"crossref","unstructured":"Yi, K., Trulls, E., Lepetit, V., Fua, P.: Lift: Learned invariant feature transform. arXiv:1603.09114 (2016)","DOI":"10.1007\/978-3-319-46466-4_28"},{"key":"2702_CR156","doi-asserted-by":"crossref","unstructured":"DeTone, D., Malisiewicz, T., Rabinovich, A.: Superpoint: Self-supervised interest point detection and description. 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW), 337\u201333712 (2018)","DOI":"10.1109\/CVPRW.2018.00060"},{"key":"2702_CR157","unstructured":"Ono, Y., Trulls, E., Fua, P., Yi, K.: Lf-net: Learning local features from images. In: NeurIPS (2018)"},{"key":"2702_CR158","doi-asserted-by":"crossref","unstructured":"Altwaijry, H., Veit, A., Belongie, S.J.: Learning to detect and match keypoints with deep architectures. In: BMVC (2016)","DOI":"10.5244\/C.30.49"},{"issue":"3","key":"2702_CR159","doi-asserted-by":"publisher","first-page":"2346","DOI":"10.1109\/LRA.2018.2809549","volume":"3","author":"T Nguyen","year":"2018","unstructured":"Nguyen, T., Chen, S.W., Shivakumar, S.S., Taylor, C.J., Kumar, V.: Unsupervised deep homography: a fast and robust homography estimation model. IEEE Robot. Autom. Lett. 3(3), 2346\u20132353 (2018). https:\/\/doi.org\/10.1109\/LRA.2018.2809549","journal-title":"IEEE Robot. Autom. Lett."},{"key":"2702_CR160","doi-asserted-by":"crossref","unstructured":"Ranftl, R., Koltun, V.: Deep fundamental matrix estimation. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 284\u2013299 (2018)","DOI":"10.1007\/978-3-030-01246-5_18"},{"key":"2702_CR161","doi-asserted-by":"crossref","unstructured":"Balntas, V., Li, S., Prisacariu, V.: Relocnet: Continuous metric learning relocalisation using neural nets. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 751\u2013767 (2018)","DOI":"10.1007\/978-3-030-01264-9_46"},{"key":"2702_CR162","doi-asserted-by":"crossref","unstructured":"Valada, A., Radwan, N., Burgard, W.: Deep auxiliary learning for visual localization and odometry. 2018 IEEE International Conference on Robotics and Automation (ICRA), 6939\u20136946 (2018)","DOI":"10.1109\/ICRA.2018.8462979"},{"key":"2702_CR163","doi-asserted-by":"publisher","first-page":"4407","DOI":"10.1109\/LRA.2018.2869640","volume":"3","author":"N Radwan","year":"2018","unstructured":"Radwan, N., Valada, A., Burgard, W.: Vlocnet++: deep multitask learning for semantic visual localization and odometry. IEEE Robot. Autom. Lett. 3, 4407\u20134414 (2018). https:\/\/doi.org\/10.1109\/LRA.2018.2869640","journal-title":"IEEE Robot. Autom. Lett."},{"key":"2702_CR164","doi-asserted-by":"crossref","unstructured":"Brachmann, E., Krull, A., Nowozin, S., Shotton, J., Michel, F., Gumhold, S., Rother, C.: Dsac - differentiable ransac for camera localization. 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), 2492\u20132500 (2017)","DOI":"10.1109\/CVPR.2017.267"},{"key":"2702_CR165","doi-asserted-by":"crossref","unstructured":"Brachmann, E., Rother, C.: Learning less is more - 6d camera localization via 3d surface regression. 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 4654\u20134662 (2018)","DOI":"10.1109\/CVPR.2018.00489"},{"key":"2702_CR166","doi-asserted-by":"crossref","unstructured":"Brachmann, E., Rother, C.: Expert sample consensus applied to camera re-localization. 2019 IEEE\/CVF International Conference on Computer Vision (ICCV), 7524\u20137533 (2019)","DOI":"10.1109\/ICCV.2019.00762"},{"key":"2702_CR167","doi-asserted-by":"crossref","unstructured":"Barath, D., Cavalli, L., Pollefeys, M.: Learning to find good models in ransac. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp. 15744\u201315753 (2022)","DOI":"10.1109\/CVPR52688.2022.01529"},{"key":"2702_CR168","doi-asserted-by":"crossref","unstructured":"Yin, X., Wang, X., Du, X., Chen, Q.: Scale recovery for monocular visual odometry using depth estimated with deep convolutional neural fields. 2017 IEEE International Conference on Computer Vision (ICCV), 5871\u20135879 (2017)","DOI":"10.1109\/ICCV.2017.625"},{"key":"2702_CR169","doi-asserted-by":"crossref","unstructured":"S\u00fcnderhauf, N., Shirazi, S., Jacobson, A., Dayoub, F., Pepperell, E., Upcroft, B., Milford, M.: Place recognition with convnet landmarks: Viewpoint-robust, condition-robust, training-free. In: Robotics: Science and Systems (2015)","DOI":"10.15607\/RSS.2015.XI.022"},{"key":"2702_CR170","doi-asserted-by":"crossref","unstructured":"Merrill, N., Huang, G.: Lightweight unsupervised deep loop closure. arXiv:1805.07703 (2018)","DOI":"10.15607\/RSS.2018.XIV.032"},{"key":"2702_CR171","doi-asserted-by":"publisher","DOI":"10.1016\/j.robot.2020.103470","volume":"126","author":"AR Memon","year":"2020","unstructured":"Memon, A.R., Wang, H., Hussain, A.: Loop closure detection using supervised and unsupervised deep neural networks for monocular slam systems. Robot. Auton. Syst. 126, 103470 (2020). https:\/\/doi.org\/10.1016\/j.robot.2020.103470","journal-title":"Robot. Auton. Syst."},{"key":"2702_CR172","doi-asserted-by":"crossref","unstructured":"Clark, R., Bloesch, M., Czarnowski, J., Leutenegger, S., Davison, A.: Ls-net: Learning to solve nonlinear least squares for monocular stereo. arXiv:1809.02966 (2018)","DOI":"10.1007\/978-3-030-01237-3_18"},{"key":"2702_CR173","unstructured":"Tang, C., Tan, P.: Ba-net: Dense bundle adjustment network. arXiv:1806.04807 (2018)"},{"issue":"3","key":"2702_CR174","doi-asserted-by":"publisher","first-page":"756","DOI":"10.1007\/s11263-019-01221-0","volume":"128","author":"H Zhou","year":"2020","unstructured":"Zhou, H., Ummenhofer, B., Brox, T.: Deeptam: deep tracking and mapping with convolutional neural networks. Int. J. Comput. Vis. 128(3), 756\u2013769 (2020). https:\/\/doi.org\/10.1007\/s11263-019-01221-0","journal-title":"Int. J. Comput. Vis."},{"key":"2702_CR175","doi-asserted-by":"crossref","unstructured":"Tiwari, L., Ji, P., Tran, Q.-H., Zhuang, B., Anand, S., Chandraker, M.: Pseudo rgb-d for self-improving monocular slam and depth prediction. In: European Conference on Computer Vision, pp. 437\u2013455 (2020). Springer","DOI":"10.1007\/978-3-030-58621-8_26"},{"key":"2702_CR176","doi-asserted-by":"crossref","unstructured":"Loo, S.Y., Amiri, A.J., Mashohor, S., Tang, S.H., Zhang, H.: Cnn-svo: Improving the mapping in semi-direct visual odometry using single-image depth prediction. In: 2019 International Conference on Robotics and Automation (ICRA), pp. 5218\u20135223 (2019). IEEE","DOI":"10.1109\/ICRA.2019.8794425"},{"issue":"4","key":"2702_CR177","doi-asserted-by":"publisher","first-page":"202","DOI":"10.3390\/ijgi9040202","volume":"9","author":"J Cheng","year":"2020","unstructured":"Cheng, J., Wang, Z., Zhou, H., Li, L., Yao, J.: Dm-slam: a feature-based slam system for rigid dynamic scenes. ISPRS Int. J. Geo Inf. 9(4), 202 (2020). https:\/\/doi.org\/10.3390\/ijgi9040202","journal-title":"ISPRS Int. J. Geo Inf."},{"key":"2702_CR178","doi-asserted-by":"crossref","unstructured":"Yang, N., Stumberg, L.v., Wang, R., Cremers, D.: D3vo: Deep depth, deep pose and deep uncertainty for monocular visual odometry. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 1281\u20131292 (2020)","DOI":"10.1109\/CVPR42600.2020.00136"},{"key":"2702_CR179","doi-asserted-by":"publisher","first-page":"1231","DOI":"10.1177\/2F0278364913491297","volume":"32","author":"A Geiger","year":"2013","unstructured":"Geiger, A., Lenz, P., Stiller, C., Urtasun, R.: Vision meets robotics: The kitti dataset. Int. J. Robot. Res. 32, 1231\u20131237 (2013). https:\/\/doi.org\/10.1177\/2F0278364913491297","journal-title":"Int. J. Robot. Res."},{"key":"2702_CR180","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1177\/2F0278364913507326","volume":"33","author":"J-L Blanco-Claraco","year":"2014","unstructured":"Blanco-Claraco, J.-L., Moreno, F.A., Gonz\u00e1lez, J.: The m\u00e1laga urban dataset: High-rate stereo and lidar in a realistic urban scenario. Int. J. Robot. Res. 33, 207\u2013214 (2014). https:\/\/doi.org\/10.1177\/2F0278364913507326","journal-title":"Int. J. Robot. Res."},{"key":"2702_CR181","doi-asserted-by":"crossref","unstructured":"Sturm, J., Engelhard, N., Endres, F., Burgard, W., Cremers, D.: A benchmark for the evaluation of rgb-d slam systems. 2012 IEEE\/RSJ International Conference on Intelligent Robots and Systems, 573\u2013580 (2012)","DOI":"10.1109\/IROS.2012.6385773"},{"key":"2702_CR182","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1177\/2F0278364916679498","volume":"36","author":"W Maddern","year":"2017","unstructured":"Maddern, W., Pascoe, G., Linegar, C., Newman, P.: 1 year, 1000 km: The oxford robotcar dataset. Int. J. Robot. Res. 36, 15\u201330 (2017). https:\/\/doi.org\/10.1177\/2F0278364916679498","journal-title":"Int. J. Robot. Res."},{"key":"2702_CR183","doi-asserted-by":"publisher","first-page":"1023","DOI":"10.1177\/2F0278364915614638","volume":"35","author":"N Carlevaris-Bianco","year":"2016","unstructured":"Carlevaris-Bianco, N., Ushani, A.K., Eustice, R.: University of michigan north campus long-term vision and lidar dataset. Int. J. Robot. Res. 35, 1023\u20131035 (2016). https:\/\/doi.org\/10.1177\/2F0278364915614638","journal-title":"Int. J. Robot. Res."},{"key":"2702_CR184","doi-asserted-by":"publisher","first-page":"1157","DOI":"10.1177\/2F0278364915620033","volume":"35","author":"M Burri","year":"2016","unstructured":"Burri, M., Nikolic, J., Gohl, P., Schneider, T., Rehder, J., Omari, S., Achtelik, M., Siegwart, R.: The Euroc micro aerial vehicle datasets. Int. J. Robot. Res. 35, 1157\u20131163 (2016). https:\/\/doi.org\/10.1177\/2F0278364915620033","journal-title":"Int. J. Robot. Res."},{"key":"2702_CR185","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1177\/2F0278364917702237","volume":"36","author":"A Majdik","year":"2017","unstructured":"Majdik, A., Till, C., Scaramuzza, D.: The zurich urban micro aerial vehicle dataset. Int. J. Robot. Res. 36, 269\u2013273 (2017). https:\/\/doi.org\/10.1177\/2F0278364917702237","journal-title":"Int. J. Robot. Res."},{"key":"2702_CR186","doi-asserted-by":"publisher","first-page":"595","DOI":"10.1177\/2F0278364909103911","volume":"28","author":"M Smith","year":"2009","unstructured":"Smith, M., Baldwin, I., Churchill, W., Paul, R., Newman, P.: The new college vision and laser data set. Int. J. Robot. Res. 28, 595\u2013599 (2009). https:\/\/doi.org\/10.1177\/2F0278364909103911","journal-title":"Int. J. Robot. Res."},{"key":"2702_CR187","doi-asserted-by":"publisher","first-page":"1595","DOI":"10.1177\/2F0278364910384295","volume":"29","author":"AS Huang","year":"2010","unstructured":"Huang, A.S., Antone, M.E., Olson, E., Fletcher, L., Moore, D., Teller, S., Leonard, J.: A high-rate, heterogeneous data set from the darpa urban challenge. Int. J. Robot. Res. 29, 1595\u20131601 (2010). https:\/\/doi.org\/10.1177\/2F0278364910384295","journal-title":"Int. J. Robot. Res."},{"key":"2702_CR188","doi-asserted-by":"publisher","first-page":"1543","DOI":"10.1177\/0278364911400640","volume":"30","author":"G Pandey","year":"2011","unstructured":"Pandey, G., McBride, J., Eustice, R.: Ford campus vision and lidar data set. Int. J. Robot. Res. 30, 1543\u20131552 (2011)","journal-title":"Int. J. Robot. Res."},{"key":"2702_CR189","doi-asserted-by":"publisher","unstructured":"Engel, J., Usenko, V., Cremers, D.: A photometrically calibrated benchmark for monocular visual odometry. arXiv:1607.02555 (2016). https:\/\/doi.org\/10.1177\/2F0278364911400640","DOI":"10.1177\/2F0278364911400640"},{"key":"2702_CR190","unstructured":"Dosovitskiy, A., Ros, G., Codevilla, F., L\u00f3pez, A., Koltun, V.: Carla: An open urban driving simulator. arXiv:1711.03938 (2017)"},{"key":"2702_CR191","unstructured":"Li, W., Saeedi, S., McCormac, J., Clark, R., Tzoumanikas, D., Ye, Q., Huang, Y., Tang, R., Leutenegger, S.: Interiornet: Mega-scale multi-sensor photo-realistic indoor scenes dataset. arXiv:1809.00716 (2018)"},{"key":"2702_CR192","doi-asserted-by":"crossref","unstructured":"Kirsanov, P., Gaskarov, A., Konokhov, F., Sofiiuk, K., Vorontsova, A., Slinko, I., Zhukov, D., Bykov, S., Barinova, O., Konushin, A.: Discoman: Dataset of indoor scenes for odometry, mapping and navigation. 2019 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), 2470\u20132477 (2019)","DOI":"10.1109\/IROS40897.2019.8967921"},{"key":"2702_CR193","doi-asserted-by":"crossref","unstructured":"Wang, W., Zhu, D., Wang, X., Hu, Y., Qiu, Y., Wang, C., Kapoor, A., Scherer, S.: Tartanair: A dataset to push the limits of visual slam. 2020 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), 4909\u20134916 (2020)","DOI":"10.1109\/IROS45743.2020.9341801"},{"key":"2702_CR194","doi-asserted-by":"crossref","unstructured":"Shah, S., Dey, D., Lovett, C., Kapoor, A.: Airsim: High-fidelity visual and physical simulation for autonomous vehicles. In: FSR (2017)","DOI":"10.1007\/978-3-319-67361-5_40"},{"key":"2702_CR195","unstructured":"Richter, S.R., AlHaija, H.A., Koltun, V.: Enhancing photorealism enhancement. arXiv preprint arXiv:2105.04619 (2021)"},{"key":"2702_CR196","doi-asserted-by":"crossref","unstructured":"Behley, J., Garbade, M., Milioto, A., Quenzel, J., Behnke, S., Stachniss, C., Gall, J.: Semantickitti: A dataset for semantic scene understanding of lidar sequences. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9297\u20139307 (2019)","DOI":"10.1109\/ICCV.2019.00939"},{"key":"2702_CR197","doi-asserted-by":"crossref","unstructured":"Caesar, H., Bankiti, V., Lang, A.H., Vora, S., Liong, V.E., Xu, Q., Krishnan, A., Pan, Y., Baldan, G., Beijbom, O.: nuscenes: A multimodal dataset for autonomous driving. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11621\u201311631 (2020)","DOI":"10.1109\/CVPR42600.2020.01164"},{"key":"2702_CR198","doi-asserted-by":"crossref","unstructured":"Sun, P., Kretzschmar, H., Dotiwalla, X., Chouard, A., Patnaik, V., Tsui, P., Guo, J., Zhou, Y., Chai, Y., Caine, B., et al.: Scalability in perception for autonomous driving: Waymo open dataset. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2446\u20132454 (2020)","DOI":"10.1109\/CVPR42600.2020.00252"},{"key":"2702_CR199","unstructured":"Geyer, J., Kassahun, Y., Mahmudi, M., Ricou, X., Durgesh, R., Chung, A.S., Hauswald, L., Pham, V.H., M\u00fchlegg, M., Dorn, S., et al.: A2d2: Audi autonomous driving dataset. arXiv preprint arXiv:2004.06320 (2020)"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-022-02702-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-022-02702-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-022-02702-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,8]],"date-time":"2024-10-08T23:51:36Z","timestamp":1728431496000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-022-02702-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,11,17]]},"references-count":199,"journal-issue":{"issue":"11","published-print":{"date-parts":[[2023,11]]}},"alternative-id":["2702"],"URL":"https:\/\/doi.org\/10.1007\/s00371-022-02702-z","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,11,17]]},"assertion":[{"value":"4 October 2022","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 November 2022","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declaration"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}