{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,19]],"date-time":"2025-11-19T06:59:33Z","timestamp":1763535573970,"version":"3.40.3"},"publisher-location":"Cham","reference-count":47,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030110239"},{"type":"electronic","value":"9783030110246"}],"license":[{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019]]},"DOI":"10.1007\/978-3-030-11024-6_2","type":"book-chapter","created":{"date-parts":[[2019,1,24]],"date-time":"2019-01-24T04:29:27Z","timestamp":1548304167000},"page":"15-31","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":12,"title":["Recovering 6D Object Pose: A Review and Multi-modal Analysis"],"prefix":"10.1007","author":[{"given":"Caner","family":"Sahin","sequence":"first","affiliation":[]},{"given":"Tae-Kyun","family":"Kim","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,1,23]]},"reference":[{"key":"2_CR1","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"340","DOI":"10.1007\/978-3-642-33712-3_25","volume-title":"Computer Vision \u2013 ECCV 2012","author":"D Hoiem","year":"2012","unstructured":"Hoiem, D., Chodpathumwan, Y., Dai, Q.: Diagnosing error in object detectors. In: Fitzgibbon, A., Lazebnik, S., Perona, P., Sato, Y., Schmid, C. (eds.) ECCV 2012. LNCS, vol. 7574, pp. 340\u2013353. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-33712-3_25"},{"key":"2_CR2","doi-asserted-by":"crossref","unstructured":"Russakovsky, O., Deng, J., Huang, Z., Berg, A.C., Fei-Fei, L.: Detecting avocados to zucchinis: what have we done, and where are we going? In: ICCV (2013)","DOI":"10.1109\/ICCV.2013.258"},{"key":"2_CR3","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.J., Li, K., Fei-Fei, L.: Imagenet: a large-scale hierarchical image database. In: CVPR (2009)","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"2_CR4","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2010","unstructured":"Everingham, M., Gool, L.V., Williams, C.K., Winn, J., Zisserman, A.: The pascal visual object classes (VOC) challenge. IJCV 88, 303\u2013338 (2010)","journal-title":"IJCV"},{"key":"2_CR5","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"548","DOI":"10.1007\/978-3-642-37331-2_42","volume-title":"Computer Vision \u2013 ACCV 2012","author":"S Hinterstoisser","year":"2013","unstructured":"Hinterstoisser, S., et al.: Model based training, detection and pose estimation of texture-less 3D objects in heavily cluttered scenes. In: Lee, K.M., Matsushita, Y., Rehg, J.M., Hu, Z. (eds.) ACCV 2012. LNCS, vol. 7724, pp. 548\u2013562. Springer, Heidelberg (2013). https:\/\/doi.org\/10.1007\/978-3-642-37331-2_42"},{"key":"2_CR6","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"462","DOI":"10.1007\/978-3-319-10599-4_30","volume-title":"Computer Vision \u2013 ECCV 2014","author":"A Tejani","year":"2014","unstructured":"Tejani, A., Tang, D., Kouskouridas, R., Kim, T.-K.: Latent-class hough forests for 3D object detection and pose estimation. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8694, pp. 462\u2013477. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-10599-4_30"},{"key":"2_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"536","DOI":"10.1007\/978-3-319-10605-2_35","volume-title":"Computer Vision \u2013 ECCV 2014","author":"E Brachmann","year":"2014","unstructured":"Brachmann, E., Krull, A., Michel, F., Gumhold, S., Shotton, J., Rother, C.: Learning 6D object pose estimation using 3D object coordinates. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8690, pp. 536\u2013551. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-10605-2_35"},{"key":"2_CR8","doi-asserted-by":"crossref","unstructured":"Eppner, C., et al.: Lessons from the Amazon picking challenge: four aspects of building robotic systems. In: Proceedings of Robotics: Science and Systems (2016)","DOI":"10.24963\/ijcai.2017\/676"},{"key":"2_CR9","doi-asserted-by":"crossref","unstructured":"Jonschkowski, R., Eppner, C., Hofer, S., Martin-Martin, R., Brock, O.: Probabilistic multi-class segmentation for the Amazon picking challenge. In: IROS (2016)","DOI":"10.1109\/IROS.2016.7758087"},{"key":"2_CR10","doi-asserted-by":"publisher","first-page":"172","DOI":"10.1109\/TASE.2016.2600527","volume":"15","author":"N Correll","year":"2016","unstructured":"Correll, N., et al.: Analysis and observations from the first Amazon picking challenge. IEEE Trans. Autom. Sci. Eng. 15, 172\u2013188 (2016)","journal-title":"IEEE Trans. Autom. Sci. Eng."},{"key":"2_CR11","doi-asserted-by":"crossref","unstructured":"Doumanoglou, A., Kouskouridas, R., Malassiotis, S., Kim, T.K.: Recovering 6D object pose and predicting next-best-view in the crowd. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.390"},{"key":"2_CR12","doi-asserted-by":"crossref","unstructured":"Hodan, T., Haluza, P., Obdrzalek, S., Matas, J., Lourakis, M., Zabulis, X.: T-less: an RGB-D dataset for 6D pose estimation of texture-less objects. In: WACV (2017)","DOI":"10.1109\/WACV.2017.103"},{"key":"2_CR13","doi-asserted-by":"crossref","unstructured":"Drost, B., Ulrich, M., Navab, N., Ilic, S.: Model globally, match locally: efficient and robust 3D object recognition. In: CVPR (2010)","DOI":"10.1109\/CVPR.2010.5540108"},{"key":"2_CR14","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"834","DOI":"10.1007\/978-3-319-46487-9_51","volume-title":"Computer Vision \u2013 ECCV 2016","author":"S Hinterstoisser","year":"2016","unstructured":"Hinterstoisser, S., Lepetit, V., Rajkumar, N., Konolige, K.: Going further with point pair features. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9907, pp. 834\u2013848. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46487-9_51"},{"key":"2_CR15","doi-asserted-by":"crossref","unstructured":"Brachmann, E., Michel, F., Krull, A., Yang, M., Gumhold, S., Rother, C.: Uncertainty-driven 6D pose estimation of objects and scenes from a single RGB image. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.366"},{"key":"2_CR16","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"205","DOI":"10.1007\/978-3-319-46487-9_13","volume-title":"Computer Vision \u2013 ECCV 2016","author":"W Kehl","year":"2016","unstructured":"Kehl, W., Milletari, F., Tombari, F., Ilic, S., Navab, N.: Deep learning of local RGB-D patches for 3D object detection and 6D pose estimation. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9907, pp. 205\u2013220. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46487-9_13"},{"key":"2_CR17","doi-asserted-by":"crossref","unstructured":"Xiang, Y., Schmidt, T., Narayanan, V., Fox, D.: PoseCNN: a convolutional neural network for 6D object pose estimation in cluttered scenes. arxiv (2017)","DOI":"10.15607\/RSS.2018.XIV.019"},{"key":"2_CR18","doi-asserted-by":"crossref","unstructured":"Kehl, W., Manhardt, F., Tombari, F., Ilic, S., Navab, N.: SSD-6D: making RGB-based 3D detection and 6D pose estimation great again. In: CVPR (2017)","DOI":"10.1109\/ICCV.2017.169"},{"key":"2_CR19","doi-asserted-by":"crossref","unstructured":"Felzenszwalb, P., Girshick, R., McAllester, D., Ramanan, D.: Object detection with discriminatively trained part-based models. In: TPAMI (2010)","DOI":"10.1109\/TPAMI.2009.167"},{"key":"2_CR20","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"836","DOI":"10.1007\/978-3-642-33718-5_60","volume-title":"Computer Vision \u2013 ECCV 2012","author":"H Azizpour","year":"2012","unstructured":"Azizpour, H., Laptev, I.: Object detection using strongly-supervised deformable part models. In: Fitzgibbon, A., Lazebnik, S., Perona, P., Sato, Y., Schmid, C. (eds.) ECCV 2012. LNCS, vol. 7572, pp. 836\u2013849. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-33718-5_60"},{"key":"2_CR21","doi-asserted-by":"crossref","unstructured":"Pepik, B., Stark, M., Gehler, P., Schiele, B.: Teaching 3D geometry to deformable part models. In: CVPR (2012)","DOI":"10.1109\/CVPR.2012.6248075"},{"key":"2_CR22","doi-asserted-by":"crossref","unstructured":"Shrivastava, A., Gupta, A.: Building part-based object detectors via 3D geometry. In: ICCV (2013)","DOI":"10.1109\/ICCV.2013.219"},{"key":"2_CR23","unstructured":"Donahue, J., et al.: DeCAF: a deep convolutional activation feature for generic visual recognition. ICML (2014)"},{"key":"2_CR24","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Rich feature hierarchies for accurate object detection and semantic segmentation. In: CVPR (2014)","DOI":"10.1109\/CVPR.2014.81"},{"key":"2_CR25","unstructured":"Sermanet, P., Eigen, D., Zhang, X., Mathieu, M., Fergus, R., LeCun, Y.: OverFeat: integrated recognition, localization and detection using convolutional networks. In: ICLR (2014)"},{"key":"2_CR26","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Spatial pyramid pooling in deep convolutional networks for visual recognition. In: PAMI (2015)","DOI":"10.1109\/TPAMI.2015.2389824"},{"key":"2_CR27","doi-asserted-by":"crossref","unstructured":"Girshick, R.: Fast R-CNN. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.169"},{"key":"2_CR28","doi-asserted-by":"crossref","unstructured":"Girshick, R., Iandola, F., Darrell, T., Malik, J.: Deformable part models are convolutional neural networks. In: CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298641"},{"key":"2_CR29","doi-asserted-by":"crossref","unstructured":"Divvala, S.K., Hoiem, D., Hays, J.H., Efros, A.A., Hebert, M.: An empirical study of context in object detection. In: CVPR (2009)","DOI":"10.1109\/CVPR.2009.5206532"},{"key":"2_CR30","doi-asserted-by":"crossref","unstructured":"Torralba, A., Efros, A.A.: Unbiased look at dataset bias. In: CVPR (2011)","DOI":"10.1109\/CVPR.2011.5995347"},{"key":"2_CR31","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s11263-014-0733-5","volume":"111","author":"M Everingham","year":"2015","unstructured":"Everingham, M., Eslami, S.A., Gool, L.V., Williams, C.K., Winn, J., Zisserman, A.: The pascal visual object classes challenge: a retrospective. IJCV 111, 98\u2013136 (2015)","journal-title":"IJCV"},{"key":"2_CR32","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky, O., et al.: Imagenet large scale visual recognition challenge. IJCV 115, 211\u2013252 (2015)","journal-title":"IJCV"},{"key":"2_CR33","doi-asserted-by":"crossref","unstructured":"Rios-Cabrera, R., Tuytelaars, T.: Discriminatively trained templates for 3D object detection: a real time scalable approach. In: ICCV (2013)","DOI":"10.1109\/ICCV.2013.256"},{"key":"2_CR34","first-page":"951","volume":"31","author":"MY Liu","year":"2012","unstructured":"Liu, M.Y., Tuzel, O., Veeraraghavan, A., Taguchi, Y., Marks, T.K., Chellappa, R.: Fast object localization and pose estimation in heavy clutter for robotic bin picking. IJRR 31, 951\u2013973 (2012)","journal-title":"IJRR"},{"key":"2_CR35","doi-asserted-by":"crossref","unstructured":"Sock, J., Kasaei, S.H., Lopes, L.S., Kim, T.K.: Multi-view 6D object pose estimation and camera motion planning using RGBD images. In: 3rd International Workshop on Recovering 6D Object Pose (2017)","DOI":"10.1109\/ICCVW.2017.260"},{"key":"2_CR36","doi-asserted-by":"crossref","unstructured":"Krull, A., Brachmann, E., Michel, F., Yang, M.Y., Gumhold, S., Rother, C.: Learning analysis-by-synthesis for 6D pose estimation in RGB-D images. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.115"},{"key":"2_CR37","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"520","DOI":"10.1007\/978-3-319-10605-2_34","volume-title":"Computer Vision \u2013 ECCV 2014","author":"U Bonde","year":"2014","unstructured":"Bonde, U., Badrinarayanan, V., Cipolla, R.: Robust instance recognition in presence of occlusion and clutter. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8690, pp. 520\u2013535. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-10605-2_34"},{"key":"2_CR38","doi-asserted-by":"crossref","unstructured":"Sahin, C., Kouskouridas, R., Kim, T.K.: Iterative hough forest with histogram of control points for 6 DoF object registration from depth images. In: IROS (2016)","DOI":"10.1109\/IROS.2016.7759605"},{"key":"2_CR39","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1016\/j.imavis.2017.05.005","volume":"63","author":"C Sahin","year":"2017","unstructured":"Sahin, C., Kouskouridas, R., Kim, T.K.: A learning-based variable size part extraction architecture for 6D object pose recovery in depth images. Image Vis. Comput. (IVC) 63, 38\u201350 (2017)","journal-title":"Image Vis. Comput. (IVC)"},{"key":"2_CR40","doi-asserted-by":"crossref","unstructured":"Michel, F., et al.: Global hypothesis generation for 6D object pose estimation. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.20"},{"key":"2_CR41","doi-asserted-by":"crossref","unstructured":"Wohlhart, P., Lepetit, V.: Learning descriptors for object recognition and 3D pose estimation. In: CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298930"},{"key":"2_CR42","doi-asserted-by":"crossref","unstructured":"Balntas, V., Doumanoglou, A., Sahin, C., Sock, J., Kouskouridas, R., Kim, T.K.: Pose guided RGBD feature learning for 3D object pose estimation. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.416"},{"key":"2_CR43","doi-asserted-by":"crossref","unstructured":"Rad, M., Lepetit, V.: BB8: a scalable, accurate, robust to partial occlusion method for predicting the 3D poses of challenging objects without using depth. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.413"},{"key":"2_CR44","doi-asserted-by":"crossref","unstructured":"Tekin, B., Sinha, S.N., Fua, P.: Real-time seamless single shot 6D object pose prediction. arxiv (2017)","DOI":"10.1109\/CVPR.2018.00038"},{"key":"2_CR45","doi-asserted-by":"crossref","unstructured":"Shotton, J., Glocker, B., Zach, C., Izadi, S., Criminisi, A., Fitzgibbon, A.: Scene coordinate regression forests for camera relocalization in RGB-D images. In: CVPR (2013)","DOI":"10.1109\/CVPR.2013.377"},{"key":"2_CR46","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"606","DOI":"10.1007\/978-3-319-49409-8_52","volume-title":"Computer Vision \u2013 ECCV 2016 Workshops","author":"T Hoda\u0148","year":"2016","unstructured":"Hoda\u0148, T., Matas, J., Obdr\u017e\u00e1lek, \u0160.: On evaluation of 6D object pose estimation. In: Hua, G., J\u00e9gou, H. (eds.) ECCV 2016. LNCS, vol. 9915, pp. 606\u2013619. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-49409-8_52"},{"key":"2_CR47","doi-asserted-by":"crossref","unstructured":"Kehl, W., Tombari, F., Navab, N., Ilic, S., Lepetit, V.: Hashmod: a hashing method for scalable 3D object detection. In: BMVC (2015)","DOI":"10.5244\/C.29.36"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2018 Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-11024-6_2","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,22]],"date-time":"2023-01-22T01:38:42Z","timestamp":1674351522000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-11024-6_2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019]]},"ISBN":["9783030110239","9783030110246"],"references-count":47,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-11024-6_2","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2019]]},"assertion":[{"value":"23 January 2019","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Munich","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Germany","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 September 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14 September 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2018.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}