{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,28]],"date-time":"2025-10-28T10:50:29Z","timestamp":1761648629780,"version":"3.40.3"},"publisher-location":"Cham","reference-count":64,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030110086"},{"type":"electronic","value":"9783030110093"}],"license":[{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019]]},"DOI":"10.1007\/978-3-030-11009-3_37","type":"book-chapter","created":{"date-parts":[[2019,1,24]],"date-time":"2019-01-24T06:24:44Z","timestamp":1548311084000},"page":"601-618","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":23,"title":["Image-to-Voxel Model Translation with Conditional Adversarial Networks"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4466-244X","authenticated-orcid":false,"given":"Vladimir A.","family":"Knyaz","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2912-9986","authenticated-orcid":false,"given":"Vladimir V.","family":"Kniaz","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6097-5342","authenticated-orcid":false,"given":"Fabio","family":"Remondino","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2019,1,23]]},"reference":[{"issue":"9","key":"37_CR1","doi-asserted-by":"publisher","first-page":"961","DOI":"10.1007\/s11263-018-1070-x","volume":"126","author":"Hassan Abu Alhaija","year":"2018","unstructured":"Alhaija, H.A., Mustikovela, S.K., Mescheder, L., Geiger, A., Rother, C.: Augmented reality meets computer vision: efficient data generation for urban driving scenes. Int. J. Comput. Vis. (2018). https:\/\/doi.org\/10.1007\/s11263-018-1070-x","journal-title":"International Journal of Computer Vision"},{"key":"37_CR2","doi-asserted-by":"publisher","unstructured":"Balntas, V., Doumanoglou, A., Sahin, C., Sock, J., Kouskouridas, R., Kim, T.: Pose guided RGBD feature learning for 3D object pose estimation. In: 2017 IEEE International Conference on Computer Vision, ICCV 2017, Venice, Italy, 22\u201329 October, pp. 3876\u20133884 (2017). https:\/\/doi.org\/10.1109\/ICCV.2017.416","DOI":"10.1109\/ICCV.2017.416"},{"key":"37_CR3","doi-asserted-by":"crossref","unstructured":"Balntas, V., Doumanoglou, A., Sahin, C., Sock, J., Kouskouridas, R., Kim, T.K.: Pose guided RGBD feature learning for 3D object pose estimation. In: The IEEE International Conference on Computer Vision (ICCV), October 2017","DOI":"10.1109\/ICCV.2017.416"},{"key":"37_CR4","doi-asserted-by":"crossref","unstructured":"Behl, A., Hosseini Jafari, O., Karthik Mustikovela, S., Abu Alhaija, H., Rother, C., Geiger, A.: Bounding boxes, segmentations and object coordinates: how important is recognition for 3D scene flow estimation in autonomous driving scenarios? In: The IEEE International Conference on Computer Vision (ICCV), October 2017","DOI":"10.1109\/ICCV.2017.281"},{"key":"37_CR5","doi-asserted-by":"crossref","unstructured":"Brachmann, E., et al.: DSAC - differentiable RANSAC for camera localization. In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR), July 2017","DOI":"10.1109\/CVPR.2017.267"},{"key":"37_CR6","doi-asserted-by":"crossref","unstructured":"Brachmann, E., Rother, C.: Learning less is more - 6D camera localization via 3D surface regression. In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2018","DOI":"10.1109\/CVPR.2018.00489"},{"key":"37_CR7","unstructured":"Brock, A., Lim, T., Ritchie, J., Weston, N.: Generative and discriminative voxel modeling with convolutional neural networks. pp. 1\u20139 December 2016. https:\/\/nips.cc\/Conferences\/2016. workshop contribution; Neural Inofrmation Processing Conference : 3D Deep Learning, NIPS; Conference date: 05\u201312-2016 Through 10\u201312-2016"},{"key":"37_CR8","unstructured":"Chang, A.X., et al.: ShapeNet: an information-rich 3D model repository. CoRR abs\/1512.03012 (2015)"},{"key":"37_CR9","doi-asserted-by":"crossref","unstructured":"Choy, C.B., Xu, D., Gwak, J., Chen, K., Savarese, S.: 3D\u2013R2N2: a unified approach for single and multi-view 3D object reconstruction. In: Proceedings of the European Conference on Computer Vision (ECCV) (2016)","DOI":"10.1007\/978-3-319-46484-8_38"},{"key":"37_CR10","doi-asserted-by":"publisher","unstructured":"Doumanoglou, A., Kouskouridas, R., Malassiotis, S., Kim, T.: Recovering 6D object pose and predicting next-best-view in the crowd. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2016, Las Vegas, NV, USA, 27\u201330 June 2016, pp. 3583\u20133592 (2016). https:\/\/doi.org\/10.1109\/CVPR.2016.390","DOI":"10.1109\/CVPR.2016.390"},{"key":"37_CR11","doi-asserted-by":"crossref","unstructured":"Drost, B., Ulrich, M., Bergmann, P., Hartinger, P., Steger, C.: Introducing MVTec ITODD - a dataset for 3D object recognition in industry. In: The IEEE International Conference on Computer Vision (ICCV) Workshops, October 2017","DOI":"10.1109\/ICCVW.2017.257"},{"key":"37_CR12","unstructured":"El-Hakim, S.: A flexible approach to 3D reconstruction from single images. In: ACM SIGGRAPH, vol. 1, pp. 12\u201317 (2001)"},{"key":"37_CR13","doi-asserted-by":"crossref","unstructured":"Engel, J., Stueckler, J., Cremers, D.: Large-scale direct slam with stereo cameras (2015)","DOI":"10.1109\/IROS.2015.7353631"},{"issue":"2","key":"37_CR14","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1007\/s11263-009-0275-4","volume":"88","author":"M Everingham","year":"2009","unstructured":"Everingham, M., Van Gool, L., Williams, C.K.I., Winn, J., Zisserman, A.: The pascal visual object classes (VOC) challenge. Int. J. Comput. Vis. 88(2), 303\u2013338 (2009)","journal-title":"Int. J. Comput. Vis."},{"key":"37_CR15","doi-asserted-by":"crossref","unstructured":"Firman, M., Mac Aodha, O., Julier, S., Brostow, G.J.: Structured prediction of unobserved voxels from a single depth image. In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2016","DOI":"10.1109\/CVPR.2016.586"},{"issue":"11","key":"37_CR16","doi-asserted-by":"publisher","first-page":"1231","DOI":"10.1177\/0278364913491297","volume":"32","author":"A Geiger","year":"2013","unstructured":"Geiger, A., Lenz, P., Stiller, C., Urtasun, R.: Vision meets robotics: the KITTI dataset. Int. J. Robot. Res. (IJRR) 32(11), 1231\u20131237 (2013)","journal-title":"Int. J. Robot. Res. (IJRR)"},{"key":"37_CR17","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"484","DOI":"10.1007\/978-3-319-46466-4_29","volume-title":"Computer Vision \u2013 ECCV 2016","author":"R Girdhar","year":"2016","unstructured":"Girdhar, R., Fouhey, D.F., Rodriguez, M., Gupta, A.: Learning a predictable and generative vector representation for objects. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9910, pp. 484\u2013499. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46466-4_29"},{"key":"37_CR18","unstructured":"Goodfellow, I., et al.: Generative adversarial nets. In: Advances in Neural Information Processing Systems, pp. 2672\u20132680 (2014)"},{"key":"37_CR19","doi-asserted-by":"crossref","unstructured":"Heinly, J., Schonberger, J.L., Dunn, E., Frahm, J.M.: Reconstructing the world* in six days *(as captured by the Yahoo 100 million image dataset). In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2015","DOI":"10.1109\/CVPR.2015.7298949"},{"key":"37_CR20","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"548","DOI":"10.1007\/978-3-642-37331-2_42","volume-title":"Computer Vision \u2013 ACCV 2012","author":"S Hinterstoisser","year":"2013","unstructured":"Hinterstoisser, S., et al.: Model based training, detection and pose estimation of texture-less 3D objects in heavily cluttered scenes. In: Lee, K.M., Matsushita, Y., Rehg, J.M., Hu, Z. (eds.) ACCV 2012. LNCS, vol. 7724, pp. 548\u2013562. Springer, Heidelberg (2013). https:\/\/doi.org\/10.1007\/978-3-642-37331-2_42"},{"key":"37_CR21","doi-asserted-by":"crossref","unstructured":"Hoda\u0148, T., Haluza, P., Obdr\u017e\u00e1lek, \u0160., Matas, J., Lourakis, M., Zabulis, X.: T-LESS: an RGB-D dataset for 6D pose estimation of texture-less objects. In: IEEE Winter Conference on Applications of Computer Vision (WACV) (2017)","DOI":"10.1109\/WACV.2017.103"},{"key":"37_CR22","doi-asserted-by":"publisher","unstructured":"Hodan, T., Haluza, P., Obdrz\u00e1lek, S., Matas, J., Lourakis, M.I.A., Zabulis, X.: T-LESS: an RGB-D dataset for 6D pose estimation of texture-less objects. In: 2017 IEEE Winter Conference on Applications of Computer Vision WACV 2017, Santa Rosa, CA, USA, 24\u201331 March 2017, pp. 880\u2013888 (2017). https:\/\/doi.org\/10.1109\/WACV.2017.103","DOI":"10.1109\/WACV.2017.103"},{"key":"37_CR23","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"606","DOI":"10.1007\/978-3-319-49409-8_52","volume-title":"Computer Vision \u2013 ECCV 2016 Workshops","author":"T Hoda\u0148","year":"2016","unstructured":"Hoda\u0148, T., Matas, J., Obdr\u017e\u00e1lek, \u0160.: On evaluation of 6D object pose estimation. In: Hua, G., J\u00e9gou, H. (eds.) ECCV 2016. LNCS, vol. 9915, pp. 606\u2013619. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-49409-8_52"},{"key":"37_CR24","unstructured":"Hoda\u0148, T., Michel, F., Sahin, C., Kim, T.K., Matas, J., Rother, C.: SIXD Challenge 2017. http:\/\/cmp.felk.cvut.cz\/sixd\/challenge_2017\/. Accessed 01 July 2018"},{"key":"37_CR25","doi-asserted-by":"crossref","unstructured":"Hoppe, C., Klopschitz, M., Donoser, M., Bischof, H.: Incremental surface extraction from sparse structure-from-motion point clouds. In: Proceedings of the British Machine Vision Conference 2013, pp. 94:1\u201394:11, British Machine Vision Association (2013)","DOI":"10.5244\/C.27.94"},{"issue":"4","key":"37_CR26","doi-asserted-by":"publisher","first-page":"87:1","DOI":"10.1145\/2766890","volume":"34","author":"Q Huang","year":"2015","unstructured":"Huang, Q., Wang, H., Koltun, V.: Single-view reconstruction via joint analysis of image and shape collections. ACM Trans. Graph. 34(4), 87:1\u201387:10 (2015)","journal-title":"ACM Trans. Graph."},{"key":"37_CR27","doi-asserted-by":"crossref","unstructured":"Isola, P., Zhu, J.Y., Zhou, T., Efros, A.A.: Image-to-image translation with conditional adversarial networks. In: 2017 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 5967\u20135976. IEEE (2017)","DOI":"10.1109\/CVPR.2017.632"},{"key":"37_CR28","doi-asserted-by":"crossref","unstructured":"Kendall, A., Grimes, M., Cipolla, R.: PoseNet: a convolutional network for real-time 6-DOF camera relocalization. In: Proceedings of the IEEE International Conference on Computer Vision, University of Cambridge, Cambridge, United Kingdom, pp. 2938\u20132946. IEEE, February 2015","DOI":"10.1109\/ICCV.2015.336"},{"key":"37_CR29","doi-asserted-by":"publisher","first-page":"63","DOI":"10.5194\/isprsarchives-XLI-B5-63-2016","volume":"XLI-B5","author":"V. V. Kniaz","year":"2016","unstructured":"Kniaz, V.V.: Robust vision-based pose estimation algorithm for an UAV with known gravity vector. ISPRS-Int. Arch. Photogram. Remote Sens. Spat. Inf. Sci. XLI-B5, 63\u201368 (2016). https:\/\/doi.org\/10.5194\/isprs-archives-XLI-B5-63-2016","journal-title":"ISPRS - International Archives of the Photogrammetry, Remote Sensing and Spatial Information Sciences"},{"key":"37_CR30","doi-asserted-by":"publisher","unstructured":"Knyaz, V., Zheltov, S.: Accuracy evaluation of structure from motion surface 3D reconstruction. In: Proceedings of SPIE, vol. 10332, pp. 10332-1\u201310332-10 (2017). https:\/\/doi.org\/10.1117\/12.2272021","DOI":"10.1117\/12.2272021"},{"key":"37_CR31","doi-asserted-by":"publisher","unstructured":"Knyaz, V.A., et al.: Deep learning of convolutional auto-encoder for image matching and 3d object reconstruction in the infrared range. In: The IEEE International Conference on Computer Vision (ICCV) Workshops, pp. 2155\u20132164 (2017). https:\/\/doi.org\/10.1109\/ICCVW.2017.252","DOI":"10.1109\/ICCVW.2017.252"},{"key":"37_CR32","doi-asserted-by":"crossref","unstructured":"Krull, A., Brachmann, E., Nowozin, S., Michel, F., Shotton, J., Rother, C.: PoseAgent: budget-constrained 6d object pose estimation via reinforcement learning. In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR), July 2017","DOI":"10.1109\/CVPR.2017.275"},{"key":"37_CR33","doi-asserted-by":"crossref","unstructured":"Lim, J.J., Pirsiavash, H., Torralba, A.: Parsing IKEA objects: fine pose estimation. In: ICCV (2013)","DOI":"10.1109\/ICCV.2013.372"},{"key":"37_CR34","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., Darrell, T.: Fully convolutional networks for semantic segmentation. In: 2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 3431\u20133440. IEEE (2015)","DOI":"10.1109\/CVPR.2015.7298965"},{"issue":"11","key":"37_CR35","first-page":"506","volume":"76","author":"M Ma","year":"2017","unstructured":"Ma, M., Marturi, N., Li, Y., Leonardis, A., Stolkin, R.: Region-sequence based six-stream CNN features for general and fine-grained human action recognition in videos. Pattern Recogn. 76(11), 506\u2013521 (2017)","journal-title":"Pattern Recogn."},{"key":"37_CR36","doi-asserted-by":"crossref","unstructured":"Menze, M., Geiger, A.: Object scene flow for autonomous vehicles. In: CVPR, pp. 3061\u20133070 (2015)","DOI":"10.1109\/CVPR.2015.7298925"},{"key":"37_CR37","unstructured":"Paszke, A., et al.: Automatic differentiation in pyTorch (2017)"},{"key":"37_CR38","doi-asserted-by":"crossref","unstructured":"Poiesi, F., Locher, A., Chippendale, P., Nocerino, E., Remondino, F., Van Gool, L.: Cloud-based collaborative 3D reconstruction using smartphones. In: the 14th ACM European Conference on Visual Media Production (CVMP), pp. 1\u20139. ACM Press, New York (2017)","DOI":"10.1145\/3150165.3150166"},{"key":"37_CR39","doi-asserted-by":"crossref","unstructured":"Qi, C.R., Liu, W., Wu, C., Su, H., Guibas, L.J.: Frustum pointNets for 3D object detection from RGB-D data. arXiv preprint arXiv:1711.08488 (2017)","DOI":"10.1109\/CVPR.2018.00102"},{"key":"37_CR40","doi-asserted-by":"publisher","unstructured":"Rad, M., Lepetit, V.: BB8: a scalable, accurate, robust to partial occlusion method for predicting the 3D poses of challenging objects without using depth. In: IEEE International Conference on Computer Vision, ICCV 2017, Venice, Italy, 22\u201329 October 2017, pp. 3848\u20133856 (2017). https:\/\/doi.org\/10.1109\/ICCV.2017.413","DOI":"10.1109\/ICCV.2017.413"},{"key":"37_CR41","doi-asserted-by":"publisher","first-page":"591","DOI":"10.5194\/isprs-archives-XLII-2-W5-591-2017","volume":"XLII-2\/W5","author":"F. Remondino","year":"2017","unstructured":"Remondino, F., Nocerino, E., Toschi, I., Menna, F.: A critical review of automated photogrammetric processing of large datasets. ISPRS - Int. Arch. Photogram. Remote Sens. Spat. Inf. Sci. 42, 591\u2013599 (2017). XLII-2\/W5. https:\/\/doi.org\/10.5194\/isprs-archives-XLII-2-W5-591-2017","journal-title":"ISPRS - International Archives of the Photogrammetry, Remote Sensing and Spatial Information Sciences"},{"key":"37_CR42","unstructured":"Remondino, F., Roditakis, A.: Human figure reconstruction and modeling from single image or monocular video sequence. In: 2003 Fourth International Conference on 3-D Digital Imaging and Modeling, 3DIM 2003, pp. 116\u2013123. IEEE October 2003"},{"issue":"115","key":"37_CR43","doi-asserted-by":"publisher","first-page":"269","DOI":"10.1111\/j.1477-9730.2006.00383.x","volume":"21","author":"F Remondino","year":"2006","unstructured":"Remondino, F., El-Hakim, S.: Image-based 3D modelling: a review. Photogram. Rec. 21(115), 269\u2013291 (2006)","journal-title":"Photogram. Rec."},{"key":"37_CR44","unstructured":"Richter, S.R., Roth, S.: Matryoshka networks: predicting 3D geometry via nested shape layers. arXiv.org, April 2018"},{"key":"37_CR45","doi-asserted-by":"crossref","unstructured":"Rock, J., Gupta, T., Thorsen, J., Gwak, J., Shin, D., Hoiem, D.: Completing 3D object shape from one depth image. In: 2013 IEEE Conference on Computer Vision and Pattern Recognition, pp. 2484\u20132493. University of Illinois at Urbana-Champaign, Urbana, IEEE, October 2015","DOI":"10.1109\/CVPR.2015.7298863"},{"key":"37_CR46","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"234","DOI":"10.1007\/978-3-319-24574-4_28","volume-title":"Medical Image Computing and Computer-Assisted Intervention \u2013 MICCAI 2015","author":"O Ronneberger","year":"2015","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-Net: convolutional networks for biomedical image segmentation. In: Navab, N., Hornegger, J., Wells, W.M., Frangi, A.F. (eds.) MICCAI 2015. LNCS, vol. 9351, pp. 234\u2013241. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-24574-4_28"},{"key":"37_CR47","doi-asserted-by":"crossref","unstructured":"Schonberger, J.L., Frahm, J.M.: Structure-from-motion revisited. In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2016","DOI":"10.1109\/CVPR.2016.445"},{"key":"37_CR48","doi-asserted-by":"crossref","unstructured":"Shin, D., Fowlkes, C., Hoiem, D.: Pixels, voxels, and views: a study of shape representations for single view 3D object shape prediction. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2018)","DOI":"10.1109\/CVPR.2018.00323"},{"key":"37_CR49","doi-asserted-by":"publisher","unstructured":"Shotton, J., Glocker, B., Zach, C., Izadi, S., Criminisi, A., Fitzgibbon, A.: Scene coordinate regression forests for camera relocalization in RGB-D images. In: Proceedings of the 2013 IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2013, pp. 2930\u20132937. IEEE Computer Society, Washington (2013). https:\/\/doi.org\/10.1109\/CVPR.2013.377","DOI":"10.1109\/CVPR.2013.377"},{"key":"37_CR50","unstructured":"Sock, J., Kim, K.I., Sahin, C., Kim, T.K.: Multi-task deep networks for depth-based 6D object pose and joint registration in crowd scenarios. arXiv.org, June 2018"},{"key":"37_CR51","doi-asserted-by":"crossref","unstructured":"Song, S., Yu, F., Zeng, A., Chang, A.X., Savva, M., Funkhouser, T.: Semantic scene completion from a single depth image. In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR), July 2017","DOI":"10.1109\/CVPR.2017.28"},{"key":"37_CR52","doi-asserted-by":"crossref","unstructured":"Sun, X., et al.: Pix3D: dataset and methods for single-image 3D shape modeling. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2018)","DOI":"10.1109\/CVPR.2018.00314"},{"key":"37_CR53","doi-asserted-by":"crossref","unstructured":"Tatarchenko, M., Dosovitskiy, A., Brox, T.: Multi-view 3D models from single images with a convolutional network. arXiv.org, November 2015","DOI":"10.1007\/978-3-319-46478-7_20"},{"key":"37_CR54","doi-asserted-by":"publisher","first-page":"1097","DOI":"10.5194\/isprs-archives-XLII-2-1097-2018","volume":"XLII-2","author":"Y. Tefera","year":"2018","unstructured":"Tefera, Y., Poiesi, F., Morabito, D., Remondino, F., Nocerino, E., Chippendale, P.: 3DNOW: image-based 3D reconstruction and modeling via web. ISPRS - Int. Arch. Photogram. Remote Sens. Spat. Inf. Sci. 1097\u20131103 (2018). XLII-2. https:\/\/doi.org\/10.5194\/isprs-archives-XLII-2-1097-2018","journal-title":"ISPRS - International Archives of the Photogrammetry, Remote Sensing and Spatial Information Sciences"},{"issue":"1","key":"37_CR55","doi-asserted-by":"publisher","first-page":"119","DOI":"10.1109\/TPAMI.2017.2665623","volume":"40","author":"Alykhan Tejani","year":"2018","unstructured":"Tejani, A., Kouskouridas, R., Doumanoglou, A., Tang, D., Kim, T.: Latent-class hough forests for 6 DoF object pose estimation. IEEE Trans. Pattern Anal. Mach. Intell. 40(1), 119\u2013132 (2018). https:\/\/doi.org\/10.1109\/TPAMI.2017.2665623","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"37_CR56","doi-asserted-by":"crossref","unstructured":"Valentin, J., et al.: Learning to navigate the energy landscape. In: Proceedings - 2016 4th International Conference on 3D Vision, 3DV 2016, University of Oxford, Oxford, United Kingdom, pp. 323\u2013332. IEEE, December 2016","DOI":"10.1109\/3DV.2016.41"},{"key":"37_CR57","doi-asserted-by":"publisher","unstructured":"Walas, K., Nowicki, M., Ferstl, D., Skrzypczynski, P.: Depth data fusion for simultaneous localization and mapping - RGB-DD SLAM. In: 2016 IEEE International Conference on Multisensor Fusion and Integration for Intelligent Systems, MFI 2016, Baden-Baden, Germany, 19\u201321 September 2016, pp. 9\u201314 (2016). https:\/\/doi.org\/10.1109\/MFI.2016.7849459","DOI":"10.1109\/MFI.2016.7849459"},{"key":"37_CR58","unstructured":"Wu, J., Wang, Y., Xue, T., Sun, X., Freeman, W.T., Tenenbaum, J.B.: MarrNet: 3D shape reconstruction via 2.5D sketches. arXiv.org November 2017"},{"key":"37_CR59","unstructured":"Wu, J., Zhang, C., Xue, T., Freeman, B., Tenenbaum, J.: Learning a probabilistic latent space of object shapes via 3D generative-adversarial modeling, pp. 82\u201390 (2016)"},{"key":"37_CR60","doi-asserted-by":"crossref","unstructured":"Xiang, Y., Mottaghi, R., Savarese, S.: Beyond PASCAL: a benchmark for 3D object detection in the wild. In: IEEE Winter Conference on Applications of Computer Vision (WACV) (2014)","DOI":"10.1109\/WACV.2014.6836101"},{"key":"37_CR61","unstructured":"Yan, X., Yang, J., Yumer, E., Guo, Y., Lee, H.: Perspective transformer nets: Learning single-view 3D object reconstruction without 3D supervision (2016). papers.nips.cc"},{"key":"37_CR62","doi-asserted-by":"crossref","unstructured":"Yang, B., Rosa, S., Markham, A., Trigoni, N., Wen, H.: 3D object dense reconstruction from a single depth view. arXiv preprint arXiv:1802.00411 (2018)","DOI":"10.1109\/ICCVW.2017.86"},{"key":"37_CR63","doi-asserted-by":"crossref","unstructured":"Yang, B., Wen, H., Wang, S., Clark, R., Markham, A., Trigoni, N.: 3D object reconstruction from a single depth view with adversarial learning. In: The IEEE International Conference on Computer Vision (ICCV) Workshops, October 2017","DOI":"10.1109\/ICCVW.2017.86"},{"key":"37_CR64","doi-asserted-by":"crossref","unstructured":"Zheng, B., Zhao, Y., Yu, J.C., Ikeuchi, K., Zhu, S.C.: Beyond point clouds: scene understanding by reasoning geometry and physics. In: The IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2013","DOI":"10.1109\/CVPR.2013.402"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2018 Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-11009-3_37","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,22]],"date-time":"2023-01-22T01:13:07Z","timestamp":1674349987000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-11009-3_37"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019]]},"ISBN":["9783030110086","9783030110093"],"references-count":64,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-11009-3_37","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2019]]},"assertion":[{"value":"23 January 2019","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Munich","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Germany","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 September 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14 September 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2018.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}