{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2023,12,18]],"date-time":"2023-12-18T17:35:22Z","timestamp":1702920922838},"reference-count":41,"publisher":"Springer Science and Business Media LLC","issue":"7","license":[{"start":{"date-parts":[[2023,3,14]],"date-time":"2023-03-14T00:00:00Z","timestamp":1678752000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,3,14]],"date-time":"2023-03-14T00:00:00Z","timestamp":1678752000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Neural Process Lett"],"published-print":{"date-parts":[[2023,12]]},"DOI":"10.1007\/s11063-023-11215-2","type":"journal-article","created":{"date-parts":[[2023,3,14]],"date-time":"2023-03-14T12:03:39Z","timestamp":1678795419000},"page":"9581-9596","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Estimation of 6D Pose of Objects Based on a Variant Adversarial Autoencoder"],"prefix":"10.1007","volume":"55","author":[{"given":"Dan","family":"Huang","sequence":"first","affiliation":[]},{"given":"Hyemin","family":"Ahn","sequence":"additional","affiliation":[]},{"given":"Shile","family":"Li","sequence":"additional","affiliation":[]},{"given":"Yueming","family":"Hu","sequence":"additional","affiliation":[]},{"given":"Dongheui","family":"Lee","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,3,14]]},"reference":[{"key":"11215_CR1","unstructured":"Makhzani A, Shlens J, Jaitly N, Goodfellow I (2015) Adversarial autoencoders, Computer ence"},{"key":"11215_CR2","doi-asserted-by":"crossref","unstructured":"Yang T-Y , Huang Y-H, Lin Y-Y,Hsiu P-C, Chuang Y-Y (2018) Ssr-net: a compact soft stagewise regression network for age estimation. In: proceedings of IJCAI, vol 5, no 6, p 7","DOI":"10.24963\/ijcai.2018\/150"},{"key":"11215_CR3","doi-asserted-by":"crossref","unstructured":"Yang T-Y, Chen Y-T, Lin Y-Y, Chuang Y-Y (2019) Fsa-net: learning fine-grained structure aggregation for head pose estimation from a single image, In: proceedings of the IEEE conference on computer vision and pattern recognition, pp 1087\u20131096","DOI":"10.1109\/CVPR.2019.00118"},{"key":"11215_CR4","doi-asserted-by":"crossref","unstructured":"Sundermeyer M, Marton Z-C, Durner M, Brucker M, Triebel R (2018) Implicit 3d orientation learning for 6d object detection from rgb images, In: proceedings of the European conference on computer vision (ECCV) , pp 699\u2013715","DOI":"10.1007\/978-3-030-01231-1_43"},{"issue":"2","key":"11215_CR5","doi-asserted-by":"publisher","first-page":"21","DOI":"10.3390\/robotics9020021","volume":"9","author":"Z Makhataeva","year":"2020","unstructured":"Makhataeva Z, Varol HA (2020) Augmented reality for robotics: a review. Robotics 9(2):21","journal-title":"Robotics"},{"key":"11215_CR6","doi-asserted-by":"crossref","unstructured":"Orbik J, Agostini A, Lee D (2021) Inverse reinforcement learning for dexterous hand manipulation, In: 2021 IEEE international conference on development and learning (ICDL). IEEE, pp 1\u20137","DOI":"10.1109\/ICDL49984.2021.9515637"},{"key":"11215_CR7","doi-asserted-by":"crossref","unstructured":"He Y, Sun W, Huang H, Liu J, Fan H, Sun J (2020) Pvn3d: a deep point-wise 3d keypoints voting network for 6dof pose estimation, In: proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 11632\u201311641","DOI":"10.1109\/CVPR42600.2020.01165"},{"key":"11215_CR8","doi-asserted-by":"crossref","unstructured":"Wang C, Mart\u00edn-Mart\u00edn R, Xu D, Lv J, Lu C, Fei-Fei L, Savarese S, Zhu Y (2020) 6-Pack: category-level 6d pose tracker with anchor-based keypoints, In: 2020 IEEE international conference on robotics and automation (ICRA).IEEE, pp 10059\u201310066","DOI":"10.1109\/ICRA40945.2020.9196679"},{"key":"11215_CR9","unstructured":"Gonzalez M, Kacete A, Murienne A, Marchand E (2020) Yoloff: you only learn offsets for robust 6dof object pose estimation,\u201d http:\/\/arxiv.org\/abs\/2002.00911"},{"key":"11215_CR10","unstructured":"Yu X, Schmidt T, Narayanan V, Fox D (2018) Posecnn: a convolutional neural network for 6d object pose estimation in cluttered scenes, In: robotics:science and systems 2018"},{"key":"11215_CR11","doi-asserted-by":"crossref","unstructured":"Tejani A, Tang D, Kouskouridas R, Kim TK (2014) Latent-class hough forests for 3d object detection and pose estimation, In: European conference on computer vision","DOI":"10.1007\/978-3-319-10599-4_30"},{"key":"11215_CR12","doi-asserted-by":"crossref","unstructured":"Kehl W, Milletari F, Tombari F, Ilic S, Navab N (2016) Deep learning of local rgb-d patches for 3d object detection and 6d pose estimation, In: European conference on computer vision","DOI":"10.1007\/978-3-319-46487-9_13"},{"key":"11215_CR13","doi-asserted-by":"crossref","unstructured":"Drost B, Ulrich M, Navab N, Ilic S (2010) Model globally, match locally: Efficient and robust 3d object recognition,\u201d In: computer vision & pattern recognition","DOI":"10.1109\/CVPR.2010.5540108"},{"key":"11215_CR14","doi-asserted-by":"publisher","first-page":"2417","DOI":"10.1007\/s11063-020-10198-8","volume":"51","author":"S Sun","year":"2020","unstructured":"Sun S, Liu R, Du Q, Sun S (2020) Selective embedding with gated fusion for 6d object pose estimation. Neural Process Lett 51:2417\u20132436","journal-title":"Neural Process Lett"},{"issue":"7","key":"11215_CR15","doi-asserted-by":"publisher","first-page":"3952","DOI":"10.1109\/TII.2018.2884211","volume":"15","author":"C Hong","year":"2018","unstructured":"Hong C, Yu J, Zhang J, Jin X, Lee K-H (2018) Multimodal face-pose estimation with multitask manifold deep learning. IEEE Trans Ind Inform 15(7):3952\u20133961","journal-title":"IEEE Trans Ind Inform"},{"issue":"12","key":"11215_CR16","doi-asserted-by":"publisher","first-page":"5659","DOI":"10.1109\/TIP.2015.2487860","volume":"24","author":"C Hong","year":"2015","unstructured":"Hong C, Yu J, Wan J, Tao D, Wang M (2015) Multimodal deep autoencoder for human pose recovery. IEEE Trans Image Process 24(12):5659\u20135670","journal-title":"IEEE Trans Image Process"},{"key":"11215_CR17","doi-asserted-by":"publisher","DOI":"10.1007\/s11063-022-11134-8","author":"S Zhang","year":"2022","unstructured":"Zhang S, Wang T, Cao J, Liu J (2022) Multichannel matrix randomized autoencoder. Neural Process Lett. https:\/\/doi.org\/10.1007\/s11063-022-11134-8","journal-title":"Neural Process Lett"},{"key":"11215_CR18","unstructured":"Li S, Koo S, Lee D (2015) Real-time and model-free object tracking using particle filter with joint color-spatial descriptor, In: 2015 IEEE\/RSJ international conference on intelligent robots and systems (IROS). IEEE, pp 6079\u20136085"},{"key":"11215_CR19","doi-asserted-by":"crossref","unstructured":"Hodan T, Haluza P, Obdr\u017e\u00e1lek \u0160, Matas J, Lourakis M, Zabulis X (2017) T-less: an rgb-d dataset for 6d pose estimation of texture-less objects, In: 2017 IEEE winter conference on applications of computer vision (WACV).IEEE, pp 880\u2013888","DOI":"10.1109\/WACV.2017.103"},{"issue":"3","key":"11215_CR20","doi-asserted-by":"publisher","first-page":"1677","DOI":"10.1007\/s10462-020-09888-5","volume":"54","author":"G Du","year":"2020","unstructured":"Du G, Wang K, Lian S, Zhao K (2020) Vision-based robotic grasping from object localization, object pose estimation to grasp estimation for parallel grippers: a review. Artif Intell Rev 54(3):1677\u20131734","journal-title":"Artif Intell Rev"},{"key":"11215_CR21","doi-asserted-by":"crossref","unstructured":"Zakharov S, Shugurov I, Ilic S (2019) Dpod: 6d pose object detector and refiner, In: proceedings of the IEEE international conference on computer vision, pp 1941\u20131950","DOI":"10.1109\/ICCV.2019.00203"},{"key":"11215_CR22","doi-asserted-by":"crossref","unstructured":"Hu Y, Fua P, Wang W, Salzmann M (2020) Single-stage 6d object pose estimation, In: proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp 2930\u20132939","DOI":"10.1109\/CVPR42600.2020.00300"},{"key":"11215_CR23","doi-asserted-by":"crossref","unstructured":"Tekin B, Sinha SN, Fua P (2018) Real-time seamless single shot 6d object pose prediction, In: proceedings of the IEEE conference on computer vision and pattern recognition, pp 292\u2013301","DOI":"10.1109\/CVPR.2018.00038"},{"key":"11215_CR24","doi-asserted-by":"crossref","unstructured":"Hu Y, Hugonot J, Fua P, Salzmann M (2019) Segmentation-driven 6d object pose estimation, In: proceedings of the IEEE conference on computer vision and pattern recognition, pp 3385\u20133394","DOI":"10.1109\/CVPR.2019.00350"},{"key":"11215_CR25","doi-asserted-by":"crossref","unstructured":"Peng S, Liu Y, Huang Q, Zhou X, Bao H (2019) Pvnet: pixel-wise voting network for 6dof pose estimation, In: 2019 IEEE\/CVF conference on computer vision and pattern recognition (CVPR)","DOI":"10.1109\/CVPR.2019.00469"},{"key":"11215_CR26","doi-asserted-by":"crossref","unstructured":"Wang C, Xu D, Zhu Y, Mart\u00edn-Mart\u00edn R, Lu C, Fei-Fei L, Savarese S (2019) Densefusion: 6d object pose estimation by iterative dense fusion, In: proceedings of the IEEE conference on computer vision and pattern recognition, pp 3343\u20133352","DOI":"10.1109\/CVPR.2019.00346"},{"issue":"18","key":"11215_CR27","doi-asserted-by":"publisher","first-page":"5086","DOI":"10.3390\/s20185086","volume":"20","author":"A Zhu","year":"2020","unstructured":"Zhu A, Yang J, Zhao W, Cao Z (2020) Lrf-net: learning local reference frames for 3d local shape description and matching. Sensors 20(18):5086","journal-title":"Sensors"},{"key":"11215_CR28","unstructured":"Yu X, Zhuang Z, Koniusz P, Li H (2020) 6dof object pose estimation via differentiable proxy voting loss, http:\/\/arxiv.org\/abs\/2002.03923"},{"key":"11215_CR29","doi-asserted-by":"crossref","unstructured":"Mellado N, Aiger D, Mitra NJ (2014) Super 4pcs fast global pointcloud registration via smart indexing, In: computer graphics forum, vol 33, no 5 Wiley Online Library, pp 205\u2013215","DOI":"10.1111\/cgf.12446"},{"issue":"11","key":"11215_CR30","doi-asserted-by":"publisher","first-page":"2241","DOI":"10.1109\/TPAMI.2015.2513405","volume":"38","author":"J Yang","year":"2015","unstructured":"Yang J, Li H, Campbell D, Jia Y (2015) Go-icp: a globally optimal solution to 3d icp point-set registration. IEEE Trans Pattern Anal Mach Intell 38(11):2241\u20132254","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"11215_CR31","doi-asserted-by":"crossref","unstructured":"Gao G, Lauri M, Wang Y, Hu X, Zhang J, Frintrop S (2020) 6d Object pose regression via supervised learning on point clouds, pp 3643\u20133649","DOI":"10.1109\/ICRA40945.2020.9197461"},{"issue":"2","key":"11215_CR32","doi-asserted-by":"publisher","first-page":"563","DOI":"10.1109\/TPAMI.2019.2932058","volume":"44","author":"J Yu","year":"2019","unstructured":"Yu J, Tan M, Zhang H, Rui Y, Tao D (2019) Hierarchical deep click feature prediction for fine-grained image recognition. IEEE Trans Pattern Anal Mach Intell 44(2):563\u2013578","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"11215_CR33","unstructured":"Kingma DP, Ba J, (2014) Adam: a method for stochastic optimization, http:\/\/arxiv.org\/abs\/1412.6980"},{"key":"11215_CR34","first-page":"249","volume":"9","author":"X Glorot","year":"2010","unstructured":"Glorot X, Bengio Y (2010) Understanding the difficulty of training deep feedforward neural networks. J Mach Learn Res 9:249\u2013256","journal-title":"J Mach Learn Res"},{"key":"11215_CR35","doi-asserted-by":"crossref","unstructured":"Hinterstoisser S, Benhimane S, Lepetit V, Fua P, Navab N (2008) Simultaneous recognition and homography extraction of local patches with a simple linear classifier. In: BMVC. Citeseer, pp 1\u201310","DOI":"10.5244\/C.22.10"},{"issue":"1","key":"11215_CR36","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1007\/s11263-014-0733-5","volume":"111","author":"M Everingham","year":"2015","unstructured":"Everingham M, Eslami SA, Van Gool L, Williams CK, Winn J, Zisserman A (2015) The pascal visual object classes challenge: a retrospective. Int J Comput Vis 111(1):98\u2013136","journal-title":"Int J Comput Vis"},{"key":"11215_CR37","doi-asserted-by":"crossref","unstructured":"Drost B, Ulrich M, Navab N, Ilic S, Model globally, match locally: Efficient and robust 3d object recognition, In: (2010) IEEE computer society conference on computer vision and pattern recognition. IEEE, pp 998\u20131005","DOI":"10.1109\/CVPR.2010.5540108"},{"key":"11215_CR38","doi-asserted-by":"crossref","unstructured":"Choi C, Christensen HI (2012) 3d pose estimation of daily objects using an rgb-d camera, In: 2012 IEEE\/RSJ international conference on intelligent robots and systems. IEEE, pp 3342\u20133349","DOI":"10.1109\/IROS.2012.6386067"},{"key":"11215_CR39","doi-asserted-by":"crossref","unstructured":"Shotton J, Glocker B, Zach C, Izadi S, Criminisi A, Fitzgibbon A (2013) Scene coordinate regression forests for camera relocalization in rgb-d images, In: proceedings of the IEEE conference on computer vision and pattern recognition, pp 2930\u20132937","DOI":"10.1109\/CVPR.2013.377"},{"key":"11215_CR40","doi-asserted-by":"crossref","unstructured":"Hoda\u0148 T, Matas J, Obdr\u017e\u00e1lek \u0160 (2016) On evaluation of 6d object pose estimation, In: European conference on computer vision. Springer, pp 606\u2013619","DOI":"10.1007\/978-3-319-49409-8_52"},{"key":"11215_CR41","doi-asserted-by":"crossref","unstructured":"Liu W, Anguelov D, Erhan D, Szegedy C, Reed S, Fu C-Y, Berg AC (2016) Ssd: single shot multibox detector, In: European conference on computer vision. Springer, pp 21\u201337","DOI":"10.1007\/978-3-319-46448-0_2"}],"container-title":["Neural Processing Letters"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11063-023-11215-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11063-023-11215-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11063-023-11215-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,11,11]],"date-time":"2023-11-11T17:13:47Z","timestamp":1699722827000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11063-023-11215-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,3,14]]},"references-count":41,"journal-issue":{"issue":"7","published-print":{"date-parts":[[2023,12]]}},"alternative-id":["11215"],"URL":"https:\/\/doi.org\/10.1007\/s11063-023-11215-2","relation":{},"ISSN":["1370-4621","1573-773X"],"issn-type":[{"value":"1370-4621","type":"print"},{"value":"1573-773X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,3,14]]},"assertion":[{"value":"26 February 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 March 2023","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}