{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T07:24:01Z","timestamp":1740122641005,"version":"3.37.3"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2020,11,16]],"date-time":"2020-11-16T00:00:00Z","timestamp":1605484800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,11,16]],"date-time":"2020-11-16T00:00:00Z","timestamp":1605484800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2021,6]]},"DOI":"10.1007\/s10489-020-01982-z","type":"journal-article","created":{"date-parts":[[2020,11,16]],"date-time":"2020-11-16T09:04:53Z","timestamp":1605517493000},"page":"3581-3599","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Fast, yet robust end-to-end camera pose estimation for robotic applications"],"prefix":"10.1007","volume":"51","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2932-9091","authenticated-orcid":false,"given":"Zahra","family":"Kamranian","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hamid","family":"Sadeghian","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ahmad Reza","family":"Naghsh Nilchi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mehran","family":"Mehrandezh","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2020,11,16]]},"reference":[{"key":"1982_CR1","doi-asserted-by":"crossref","unstructured":"Bateux Q, Marchand E, Leitner J, Chaumette F, Corke P (2018) Training deep neural networks for visual servoing. In: IEEE international conference on robotics and automation (ICRA), IEEE, pp 1\u20138","DOI":"10.1109\/ICRA.2018.8461068"},{"issue":"3","key":"1982_CR2","doi-asserted-by":"publisher","first-page":"346","DOI":"10.1016\/j.cviu.2007.09.014","volume":"110","author":"H Bay","year":"2008","unstructured":"Bay H, Ess A, Tuytelaars T, Van Gool L (2008) Speeded-up robust features (surf). Comput Vision Image Underst 110(3):346\u2013359","journal-title":"Comput Vision Image Underst"},{"key":"1982_CR3","doi-asserted-by":"crossref","unstructured":"Brachmann E, Krull A, Nowozin S, Shotton J, Michel F, Gumhold S, Rother C (2017) Dsac-differentiable ransac for camera localization. In: Proceedings of the IEEE conference on computer vision and pattern recognition (CVPR), pp 6684\u20136692","DOI":"10.1109\/CVPR.2017.267"},{"key":"1982_CR4","doi-asserted-by":"crossref","unstructured":"Brachmann E, Rother C (2018) Learning less is more-6d camera localization via 3d surface regression. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 4654\u20134662","DOI":"10.1109\/CVPR.2018.00489"},{"key":"1982_CR5","doi-asserted-by":"crossref","unstructured":"Brahmbhatt S, Gu J, Kim K, Hays J, Kautz J (2018) Geometry-aware learning of maps for camera localization. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 2616\u20132625","DOI":"10.1109\/CVPR.2018.00277"},{"key":"1982_CR6","doi-asserted-by":"crossref","unstructured":"Calonder M, Lepetit V, Strecha C, Fua P (2010) Brief: binary robust independent elementary features. In: European conference on computer vision. Springer, New York, pp 778\u2013792","DOI":"10.1007\/978-3-642-15561-1_56"},{"key":"1982_CR7","doi-asserted-by":"crossref","unstructured":"Cavallari T, Golodetz S, Lord N, Valentin J, Prisacariu V, Di Stefano L, Torr PH (2019) Real-time rgb-d camera pose estimation in novel scenes using a relocalisation cascade. IEEE Transactions on Pattern Analysis and Machine Intelligence","DOI":"10.1109\/TPAMI.2019.2915068"},{"key":"1982_CR8","doi-asserted-by":"crossref","unstructured":"Charco JL, Vintimilla BX, Sappa AD (2018) Deep learning based camera pose estimation in multi-view environment. In: 2018 14Th international conference on signal-image technology & internet-based systems (SITIS), IEEE, pp 224\u2013228","DOI":"10.1109\/SITIS.2018.00041"},{"key":"1982_CR9","doi-asserted-by":"crossref","unstructured":"Chatfield K, Simonyan K, Vedaldi A, Zisserman A (2014) Return of the devil in the details:, Delving deep into convolutional nets. arXiv:1405.3531","DOI":"10.5244\/C.28.6"},{"key":"1982_CR10","doi-asserted-by":"crossref","unstructured":"Deng J, Dong W, Socher R, Li LJ, Li K, Fei-Fei L (2009) Imagenet: a large-scale hierarchical image database. In: Computer vision and pattern recognition (CVPR), IEEE, pp 248\u2013255","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"1982_CR11","unstructured":"DeTone D, Malisiewicz T, Rabinovich A (2016) Deep image homography estimation. arXiv:1606.03798"},{"key":"1982_CR12","unstructured":"Francois C (2017) Deep learning with python"},{"issue":"5","key":"1982_CR13","doi-asserted-by":"publisher","first-page":"1188","DOI":"10.1109\/TRO.2012.2197158","volume":"28","author":"D G\u00e1lvez-L\u00f3pez","year":"2012","unstructured":"G\u00e1lvez-L\u00f3pez D, Tardos JD (2012) Bags of binary words for fast place recognition in image sequences. IEEE Trans Robot 28(5):1188\u20131197","journal-title":"IEEE Trans Robot"},{"key":"1982_CR14","doi-asserted-by":"crossref","unstructured":"Glocker B, Izadi S, Shotton J, Criminisi A (2013) Real-time rgb-d camera relocalization. In: IEEE international symposium on mixed and augmented reality (ISMAR), IEEE, pp 173\u2013179","DOI":"10.1109\/ISMAR.2013.6671777"},{"issue":"5","key":"1982_CR15","doi-asserted-by":"publisher","first-page":"571","DOI":"10.1109\/TVCG.2014.2360403","volume":"21","author":"B Glocker","year":"2014","unstructured":"Glocker B, Shotton J, Criminisi A, Izadi S (2014) Real-time rgb-d camera relocalization via randomized ferns for keyframe encoding. IEEE Trans Visualizat Comput Graph 21(5):571\u2013583","journal-title":"IEEE Trans Visualizat Comput Graph"},{"issue":"11","key":"1982_CR16","doi-asserted-by":"publisher","first-page":"2895","DOI":"10.1109\/TVCG.2018.2868533","volume":"24","author":"S Golodetz","year":"2018","unstructured":"Golodetz S, Cavallari T, Lord NA, Prisacariu VA, Murray DW, Torr PH (2018) Collaborative large-scale dense 3d reconstruction with online inter-agent pose optimisation. IEEE Trans Visualizat Comput Graph 24(11):2895\u20132905","journal-title":"IEEE Trans Visualizat Comput Graph"},{"key":"1982_CR17","doi-asserted-by":"crossref","unstructured":"Held D, Thrun S, Savarese S (2016) Learning to track at 100 fps with deep regression networks. In: European conference on computer vision. Springer, New York, pp 749\u2013765","DOI":"10.1007\/978-3-319-46448-0_45"},{"issue":"11","key":"1982_CR18","doi-asserted-by":"publisher","first-page":"1241","DOI":"10.1109\/TVCG.2015.2459891","volume":"21","author":"O K\u00e4hler","year":"2015","unstructured":"K\u00e4hler O, Prisacariu VA, Ren CY, Sun X, Torr P, Murray D (2015) Very high frame rate volumetric integration of depth images on mobile devices. IEEE Trans Visualizat Comput Graph 21 (11):1241\u20131250","journal-title":"IEEE Trans Visualizat Comput Graph"},{"issue":"12","key":"1982_CR19","doi-asserted-by":"publisher","first-page":"5019","DOI":"10.1007\/s10489-018-1221-3","volume":"48","author":"Z Kamranian","year":"2018","unstructured":"Kamranian Z, Nilchi ARN, Monadjemi A, Navab N (2018) Iterative algorithm for interactive co-segmentation using semantic information propagation. Appl Intell 48(12):5019\u20135036","journal-title":"Appl Intell"},{"key":"1982_CR20","doi-asserted-by":"crossref","unstructured":"Kamranian Z, Nilchi ARN, Sadeghian H, Tombari F, Navab N (2019) Joint motion boundary detection and cnn-based feature visualization for video object segmentation. Neural Comput Applic pp 1\u201319","DOI":"10.1007\/s00521-019-04448-7"},{"key":"1982_CR21","doi-asserted-by":"publisher","first-page":"201","DOI":"10.1016\/j.jvcir.2018.05.014","volume":"55","author":"Z Kamranian","year":"2018","unstructured":"Kamranian Z, Tombari F, Nilchi ARN, Monadjemi A, Navab N (2018) Co-segmentation via visualization. J Vis Commun Image Represent 55:201\u2013214","journal-title":"J Vis Commun Image Represent"},{"key":"1982_CR22","doi-asserted-by":"crossref","unstructured":"Kendall A, Cipolla R (2017) Geometric loss functions for camera pose regression with deep learning. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 5974\u20135983","DOI":"10.1109\/CVPR.2017.694"},{"key":"1982_CR23","doi-asserted-by":"crossref","unstructured":"Kendall A, Grimes M, Cipolla R (2015) Posenet: a convolutional network for real-time 6-dof camera relocalization. In: Proceedings of the IEEE international conference on computer vision, pp 2938\u20132946","DOI":"10.1109\/ICCV.2015.336"},{"key":"1982_CR24","unstructured":"Kingma DP, Ba J (2014) Adam: a method for stochastic optimization. arXiv:1412.6980"},{"key":"1982_CR25","doi-asserted-by":"crossref","unstructured":"Konda KR, Memisevic R (2015) Learning visual odometry with a convolutional network. In: VISAPP (1), pp 486\u2013490","DOI":"10.5220\/0005299304860490"},{"key":"1982_CR26","doi-asserted-by":"crossref","unstructured":"Lathuili\u00e8re S, Mesejo P, Alameda-Pineda X, Horaud R (2019) A comprehensive analysis of deep regression. IEEE Trans Pattern Anal Mach Intell","DOI":"10.1109\/TPAMI.2019.2910523"},{"key":"1982_CR27","doi-asserted-by":"crossref","unstructured":"Li Y, Wang G, Ji X, Xiang Y, Fox D (2018) Deepim: deep iterative matching for 6d pose estimation. In: Proceedings of the european conference on computer vision (ECCV), pp 683\u2013698","DOI":"10.1007\/978-3-030-01231-1_42"},{"key":"1982_CR28","doi-asserted-by":"crossref","unstructured":"Lin Y, Liu Z, Huang J, Wang C, Du G, Bai J, Lian S (2019) Deep global-relative networks for end-to-end 6-dof visual localization and odometry. In: Pacific rim international conference on artificial intelligence. Springer, New York, pp 454\u2013467","DOI":"10.1007\/978-3-030-29911-8_35"},{"key":"1982_CR29","doi-asserted-by":"crossref","unstructured":"Liu R, Zhang H, Liu M, Xia X, Hu T (2009) Stereo cameras self-calibration based on sift. In: 2009 international conference on measuring technology and mechatronics automation, IEEE, vol 1, pp 352\u2013355","DOI":"10.1109\/ICMTMA.2009.338"},{"key":"1982_CR30","doi-asserted-by":"crossref","unstructured":"Long J, Shelhamer E, Darrell T (2015) Fully convolutional networks for semantic segmentation. In: Computer vision and pattern recognition (CVPR), conference on, IEEE, pp 3431\u20133440","DOI":"10.1109\/CVPR.2015.7298965"},{"issue":"2","key":"1982_CR31","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","volume":"60","author":"DG Lowe","year":"2004","unstructured":"Lowe DG (2004) Distinctive image features from scale-invariant keypoints. Int J Comput Vision 60(2):91\u2013110","journal-title":"Int J Comput Vision"},{"key":"1982_CR32","doi-asserted-by":"crossref","unstructured":"Melekhov I, Ylioinas J, Kannala J, Rahtu E (2017) Image-based localization using hourglass networks. In: Proceedings of the IEEE international conference on computer vision workshops, pp 879\u2013886","DOI":"10.1109\/ICCVW.2017.107"},{"key":"1982_CR33","doi-asserted-by":"crossref","unstructured":"Melekhov I, Ylioinas J, Kannala J, Rahtu E (2017) Relative camera pose estimation using convolutional neural networks. In: International conference on advanced concepts for intelligent vision systems. Springer, New York, pp 675\u2013687","DOI":"10.1007\/978-3-319-70353-4_57"},{"issue":"5","key":"1982_CR34","doi-asserted-by":"publisher","first-page":"1147","DOI":"10.1109\/TRO.2015.2463671","volume":"31","author":"R Mur-Artal","year":"2015","unstructured":"Mur-Artal R, Montiel JMM, Tardos JD (2015) Orb-slam: a versatile and accurate monocular slam system. IEEE Trans Robot 31(5):1147\u20131163","journal-title":"IEEE Trans Robot"},{"key":"1982_CR35","doi-asserted-by":"crossref","unstructured":"Noh H, Hong S, Han B (2015) Learning deconvolution network for semantic segmentation. In: Proceedings of the IEEE international conference on computer vision, pp 1520\u20131528","DOI":"10.1109\/ICCV.2015.178"},{"issue":"4","key":"1982_CR36","doi-asserted-by":"publisher","first-page":"4407","DOI":"10.1109\/LRA.2018.2869640","volume":"3","author":"N Radwan","year":"2018","unstructured":"Radwan N, Valada A, Burgard W (2018) Vlocnet++: Deep multitask learning for semantic visual localization and odometry. IEEE Robot Automat Lett 3(4):4407\u20134414","journal-title":"IEEE Robot Automat Lett"},{"key":"1982_CR37","unstructured":"Redmon J, Farhadi A (2018) Yolov3: an incremental improvement arXiv"},{"key":"1982_CR38","doi-asserted-by":"crossref","unstructured":"Rublee E, Rabaud V, Konolige K, Bradski G (2011) Orb: an efficient alternative to sift or surf. In: 2011 international conference on computer vision, Ieee, pp 2564\u20132571","DOI":"10.1109\/ICCV.2011.6126544"},{"key":"1982_CR39","doi-asserted-by":"crossref","unstructured":"Sadeghian H, Villani L, Kamranian Z, Karami A (2015) Visual servoing with safe interaction using image moments. In: IEEE\/RSJ international conference on intelligent robots and systems (IROS), IEEE, pp 5479\u20135485","DOI":"10.1109\/IROS.2015.7354153"},{"key":"1982_CR40","doi-asserted-by":"crossref","unstructured":"Sarlin PE, Cadena C, Siegwart R, Dymczyk M (2019) From coarse to fine: robust hierarchical localization at large scale. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 12716\u201312725","DOI":"10.1109\/CVPR.2019.01300"},{"key":"1982_CR41","doi-asserted-by":"crossref","unstructured":"Schonberger JL, Frahm JM (2016) Structure-from-motion revisited. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 4104\u20134113","DOI":"10.1109\/CVPR.2016.445"},{"key":"1982_CR42","volume-title":"Robotics: modelling, planning and control","author":"B Siciliano","year":"2010","unstructured":"Siciliano B, Sciavicco L, Villani L, Oriolo G (2010) Robotics: modelling, planning and control. Springer Science & Business Media, New York"},{"key":"1982_CR43","unstructured":"Simonyan K, Zisserman A (2014) Very deep convolutional networks for large-scale image recognition. arXiv:1409.1556"},{"issue":"4","key":"1982_CR44","doi-asserted-by":"publisher","first-page":"591","DOI":"10.1109\/TPAMI.2008.111","volume":"31","author":"J Sivic","year":"2008","unstructured":"Sivic J, Zisserman A (2008) Efficient visual search of videos cast as text retrieval. IEEE Trans Pattern Anal Mach Intell 31(4):591\u2013606","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1982_CR45","unstructured":"Ruiz-del Solar J, Loncomilla P, Soto N (2018) A survey on deep learning methods for robot vision. arXiv:1803.10862"},{"issue":"5","key":"1982_CR46","doi-asserted-by":"publisher","first-page":"815","DOI":"10.1109\/TPAMI.2009.77","volume":"32","author":"E Tola","year":"2009","unstructured":"Tola E, Lepetit V, Fua P (2009) Daisy: an efficient dense descriptor applied to wide-baseline stereo. IEEE Trans Pattern Anal Mach Intell 32(5):815\u2013830","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1982_CR47","doi-asserted-by":"crossref","unstructured":"Ummenhofer B, Zhou H, Uhrig J, Mayer N, Ilg E, Dosovitskiy A, Brox T (2017) Demon: depth and motion network for learning monocular stereo. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 5038\u20135047","DOI":"10.1109\/CVPR.2017.596"},{"issue":"5","key":"1982_CR48","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2751556","volume":"34","author":"J Valentin","year":"2015","unstructured":"Valentin J, Vineet V, Cheng MM, Kim D, Shotton J, Kohli P, Nie\u00dfner M., Criminisi A, Izadi S, Torr P (2015) Semanticpaint: interactive 3d labeling and learning at your fingertips. ACM Trans Graph (TOG) 34(5):1\u201317","journal-title":"ACM Trans Graph (TOG)"},{"key":"1982_CR49","doi-asserted-by":"crossref","unstructured":"Wang Z, Dai Z, P\u00f3czos B, Carbonell J (2019) Characterizing and avoiding negative transfer. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 11293\u201311302","DOI":"10.1109\/CVPR.2019.01155"},{"key":"1982_CR50","doi-asserted-by":"crossref","unstructured":"Zhang Y, Wang S, Genlin J (2015) Application of time-varying acceleration coefficients pso to face pose estimation. In: First international conference on information sciences, machinery, materials and energy. Atlantis Press, Paris","DOI":"10.2991\/icismme-15.2015.12"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-020-01982-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10489-020-01982-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-020-01982-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,5,20]],"date-time":"2021-05-20T08:18:10Z","timestamp":1621498690000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10489-020-01982-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,11,16]]},"references-count":50,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2021,6]]}},"alternative-id":["1982"],"URL":"https:\/\/doi.org\/10.1007\/s10489-020-01982-z","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"type":"print","value":"0924-669X"},{"type":"electronic","value":"1573-7497"}],"subject":[],"published":{"date-parts":[[2020,11,16]]},"assertion":[{"value":"25 September 2020","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 November 2020","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance with Ethical Standards"}},{"value":"The authors declare that they have no conflicts of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"<!--Emphasis Type='Bold' removed-->Conflict of interests"}}]}}