{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,28]],"date-time":"2025-10-28T10:50:30Z","timestamp":1761648630182,"version":"3.40.3"},"publisher-location":"Cham","reference-count":68,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030110208"},{"type":"electronic","value":"9783030110215"}],"license":[{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019]]},"DOI":"10.1007\/978-3-030-11021-5_43","type":"book-chapter","created":{"date-parts":[[2019,1,24]],"date-time":"2019-01-24T04:26:13Z","timestamp":1548303973000},"page":"691-709","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":43,"title":["Every Pixel Counts: Unsupervised Geometry Learning with Holistic 3D Motion Understanding"],"prefix":"10.1007","author":[{"given":"Zhenheng","family":"Yang","sequence":"first","affiliation":[]},{"given":"Peng","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Yang","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Wei","family":"Xu","sequence":"additional","affiliation":[]},{"given":"Ram","family":"Nevatia","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,1,23]]},"reference":[{"key":"43_CR1","doi-asserted-by":"crossref","unstructured":"Godard, C., Mac Aodha, O., Brostow, G.J.: Unsupervised monocular depth estimation with left-right consistency (2017)","DOI":"10.1109\/CVPR.2017.699"},{"key":"43_CR2","doi-asserted-by":"crossref","unstructured":"Zhou, T., Brown, M., Snavely, N., Lowe, D.G.: Unsupervised learning of depth and ego-motion from video. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.700"},{"key":"43_CR3","doi-asserted-by":"crossref","unstructured":"Yang, Z., Wang, P., Xu, W., Zhao, L., Ram, N.: Unsupervised learning of geometry from videos with edge-aware depth-normal consistency. In: AAAI (2018)","DOI":"10.1609\/aaai.v32i1.12257"},{"key":"43_CR4","doi-asserted-by":"crossref","unstructured":"Yang, Z., Wang, P., Wang, Y., Xu, W., Nevatia, R.: LEGO: learning edge with geometry all at once by watching videos. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00031"},{"key":"43_CR5","unstructured":"Eigen, D., Puhrsch, C., Fergus, R.: Depth map prediction from a single image using a multi-scale deep network. In: NIPS (2014)"},{"key":"43_CR6","unstructured":"Wu, C., et al.: VisualSFM: a visual structure from motion system (2011)"},{"key":"43_CR7","unstructured":"Vijayanarasimhan, S., Ricco, S., Schmid, C., Sukthankar, R., Fragkiadaki, K.: SfM-Net: learning of structure and motion from video. CoRR abs\/1704.07804 (2017)"},{"key":"43_CR8","doi-asserted-by":"crossref","unstructured":"Wang, Y., Yang, Y., Yang, Z., Wang, P., Zhao, L., Xu, W.: Occlusion aware unsupervised learning of optical flow. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00513"},{"issue":"5","key":"43_CR9","doi-asserted-by":"publisher","first-page":"878","DOI":"10.1109\/TPAMI.2007.70752","volume":"30","author":"L Torresani","year":"2008","unstructured":"Torresani, L., Hertzmann, A., Bregler, C.: Nonrigid structure-from-motion: estimating shape and motion with hierarchical priors. IEEE Trans. Pattern Anal. Mach. Intell. 30(5), 878\u2013892 (2008)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"43_CR10","doi-asserted-by":"crossref","unstructured":"Geiger, A., Lenz, P., Urtasun, R.: Are we ready for autonomous driving? The KITTI vision benchmark suite. In: CVPR (2012)","DOI":"10.1109\/CVPR.2012.6248074"},{"key":"43_CR11","first-page":"1","volume":"11","author":"M Bleyer","year":"2011","unstructured":"Bleyer, M., Rhemann, C., Rother, C.: PatchMatch stereo-stereo matching with slanted support windows. BMVC 11, 1\u201311 (2011)","journal-title":"BMVC"},{"issue":"5","key":"43_CR12","doi-asserted-by":"publisher","first-page":"1147","DOI":"10.1109\/TRO.2015.2463671","volume":"31","author":"R Mur-Artal","year":"2015","unstructured":"Mur-Artal, R., Montiel, J.M.M., Tardos, J.D.: ORB-SLAM: a versatile and accurate monocular slam system. IEEE Trans. Robot. 31(5), 1147\u20131163 (2015)","journal-title":"IEEE Trans. Robot."},{"key":"43_CR13","doi-asserted-by":"crossref","unstructured":"Engel, J., Sch\u00f6ps, T., Cremers, D.: LSD-SLAM: large-scale direct monocular slam. In: ECCV (2014)","DOI":"10.1007\/978-3-319-10605-2_54"},{"key":"43_CR14","doi-asserted-by":"crossref","unstructured":"Newcombe, R.A., Lovegrove, S., Davison, A.J.: DTAM: dense tracking and mapping in real-time. In: ICCV (2011)","DOI":"10.1109\/ICCV.2011.6126513"},{"issue":"2","key":"43_CR15","doi-asserted-by":"publisher","first-page":"101","DOI":"10.1007\/s11263-013-0684-2","volume":"107","author":"Y Dai","year":"2014","unstructured":"Dai, Y., Li, H., He, M.: A simple prior-free method for non-rigid structure-from-motion factorization. Int. J. Comput. Vis. 107(2), 101\u2013122 (2014)","journal-title":"Int. J. Comput. Vis."},{"key":"43_CR16","doi-asserted-by":"crossref","unstructured":"Taylor, J., Jepson, A.D., Kutulakos, K.N.: Non-rigid structure from locally-rigid motion. In: 2010 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 2761\u20132768. IEEE (2010)","DOI":"10.1109\/CVPR.2010.5540002"},{"key":"43_CR17","doi-asserted-by":"crossref","unstructured":"Kumar, S., Dai, Y., Li, H.: Monocular dense 3D reconstruction of a complex dynamic scene from two perspective frames. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.498"},{"key":"43_CR18","doi-asserted-by":"crossref","unstructured":"Kumar, S., Dai, Y., Li, H.: Multi-body non-rigid structure-from-motion. In: 2016 Fourth International Conference on 3D Vision (3DV), pp. 148\u2013156. IEEE (2016)","DOI":"10.1109\/3DV.2016.23"},{"key":"43_CR19","doi-asserted-by":"crossref","unstructured":"Hoiem, D., Efros, A.A., Hebert, M.: Recovering surface layout from an image. In: ICCV (2007)","DOI":"10.1007\/s11263-006-0031-y"},{"key":"43_CR20","doi-asserted-by":"publisher","first-page":"375","DOI":"10.1007\/0-387-28831-7_23","volume-title":"Handbook of Mathematical Models in Computer Vision","author":"E Prados","year":"2006","unstructured":"Prados, E., Faugeras, O.: Shape from shading. In: Paragios, N., Chen, Y., Faugeras, O. (eds.) Handbook of Mathematical Models in Computer Vision, pp. 375\u2013388. Springer, Boston (2006). https:\/\/doi.org\/10.1007\/0-387-28831-7_23"},{"key":"43_CR21","doi-asserted-by":"crossref","unstructured":"Kong, N., Black, M.J.: Intrinsic depth: improving depth transfer with intrinsic images. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.401"},{"key":"43_CR22","doi-asserted-by":"crossref","unstructured":"Schwing, A.G., Fidler, S., Pollefeys, M., Urtasun, R.: Box in the box: Joint 3D layout and object reasoning from single images. In: ICCV (2013)","DOI":"10.1109\/ICCV.2013.51"},{"key":"43_CR23","doi-asserted-by":"crossref","unstructured":"Srajer, F., Schwing, A.G., Pollefeys, M., Pajdla, T.: Match box: indoor image matching via box-like scene estimation. In: 3DV (2014)","DOI":"10.1109\/3DV.2014.56"},{"key":"43_CR24","doi-asserted-by":"crossref","unstructured":"Wang, X., Fouhey, D., Gupta, A.: Designing deep networks for surface normal estimation. In: CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298652"},{"key":"43_CR25","doi-asserted-by":"crossref","unstructured":"Eigen, D., Fergus, R.: Predicting depth, surface normals and semantic labels with a common multi-scale convolutional architecture. In: ICCV (2015)","DOI":"10.1109\/ICCV.2015.304"},{"key":"43_CR26","doi-asserted-by":"crossref","unstructured":"Laina, I., Rupprecht, C., Belagiannis, V., Tombari, F., Navab, N.: Deeper depth prediction with fully convolutional residual networks. In: 2016 Fourth International Conference on 3D Vision (3DV), pp. 239\u2013248. IEEE (2016)","DOI":"10.1109\/3DV.2016.32"},{"key":"43_CR27","doi-asserted-by":"crossref","unstructured":"Li, J., Klein, R., Yao, A.: A two-streamed network for estimating fine-scaled depth maps from single RGB images. In: ICCV (2017)","DOI":"10.1109\/ICCV.2017.365"},{"issue":"11","key":"43_CR28","doi-asserted-by":"publisher","first-page":"2144","DOI":"10.1109\/TPAMI.2014.2316835","volume":"36","author":"K Karsch","year":"2014","unstructured":"Karsch, K., Liu, C., Kang, S.B.: Depth transfer: depth extraction from video using non-parametric sampling. IEEE Trans. Pattern Anal. Mach. Intell. 36(11), 2144\u20132158 (2014)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"43_CR29","doi-asserted-by":"crossref","unstructured":"Ladicky, L., Shi, J., Pollefeys, M.: Pulling things out of perspective. In: CVPR (2014)","DOI":"10.1109\/CVPR.2014.19"},{"key":"43_CR30","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"468","DOI":"10.1007\/978-3-319-10602-1_31","volume-title":"Computer Vision \u2013 ECCV 2014","author":"L Ladick\u00fd","year":"2014","unstructured":"Ladick\u00fd, L., Zeisl, B., Pollefeys, M.: Discriminatively trained dense surface normal estimation. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8693, pp. 468\u2013484. Springer, Cham (2014). https:\/\/doi.org\/10.1007\/978-3-319-10602-1_31"},{"key":"43_CR31","unstructured":"Wang, P., Shen, X., Lin, Z., Cohen, S., Price, B.L., Yuille, A.L.: Towards unified depth and semantic prediction from a single image. In: CVPR (2015)"},{"key":"43_CR32","doi-asserted-by":"crossref","unstructured":"Liu, F., Shen, C., Lin, G.: Deep convolutional neural fields for depth estimation from a single image. In: CVPR, June 2015","DOI":"10.1109\/CVPR.2015.7299152"},{"key":"43_CR33","unstructured":"Li, B., Shen, C., Dai, Y., van den Hengel, A., He, M.: Depth and surface normal estimation from monocular images using regression on deep features and hierarchical CRFS. In: CVPR (2015)"},{"key":"43_CR34","unstructured":"Wang, P., Shen, X., Russell, B., Cohen, S., Price, B.L., Yuille, A.L.: SURGE: surface regularized geometry estimation from a single image. In: NIPS (2016)"},{"key":"43_CR35","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"842","DOI":"10.1007\/978-3-319-46493-0_51","volume-title":"Computer Vision \u2013 ECCV 2016","author":"J Xie","year":"2016","unstructured":"Xie, J., Girshick, R., Farhadi, A.: Deep3D: fully automatic 2D-to-3D video conversion with deep convolutional neural networks. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9908, pp. 842\u2013857. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46493-0_51"},{"key":"43_CR36","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"740","DOI":"10.1007\/978-3-319-46484-8_45","volume-title":"Computer Vision \u2013 ECCV 2016","author":"R Garg","year":"2016","unstructured":"Garg, R., Vijay Kumar, B.G., Carneiro, G., Reid, I.: Unsupervised CNN for single view depth estimation: geometry to the rescue. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9912, pp. 740\u2013756. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46484-8_45"},{"key":"43_CR37","doi-asserted-by":"crossref","unstructured":"Wang, C., Buenaposada, J.M., Zhu, R., Lucey, S.: Learning depth from monocular videos using direct methods. In: CVPR (2018)","DOI":"10.1109\/CVPR.2018.00216"},{"key":"43_CR38","doi-asserted-by":"crossref","unstructured":"Li, R., Wang, S., Long, Z., Gu, D.: UnDeepVO: Monocular visual odometry through unsupervised deep learning. In: ICRA (2018)","DOI":"10.1109\/ICRA.2018.8461251"},{"key":"43_CR39","doi-asserted-by":"crossref","unstructured":"Mahjourian, R., Wicke, M., Angelova, A.: Unsupervised learning of depth and ego-motion from monocular video using 3D geometric constraints. arXiv preprint arXiv:1802.05522 (2018)","DOI":"10.1109\/CVPR.2018.00594"},{"key":"43_CR40","doi-asserted-by":"crossref","unstructured":"Yin, Z., Shi, J.: GeoNet: unsupervised learning of dense depth, optical flow and camera pose. arXiv preprint arXiv:1803.02276 (2018)","DOI":"10.1109\/CVPR.2018.00212"},{"issue":"3","key":"43_CR41","doi-asserted-by":"publisher","first-page":"475","DOI":"10.1109\/TPAMI.2005.63","volume":"27","author":"S Vedula","year":"2005","unstructured":"Vedula, S., Rander, P., Collins, R., Kanade, T.: Three-dimensional scene flow. IEEE Trans. Pattern Anal. Mach. Intell. 27(3), 475\u2013480 (2005)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"43_CR42","doi-asserted-by":"crossref","unstructured":"Menze, M., Geiger, A.: Object scene flow for autonomous vehicles. In: CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298925"},{"key":"43_CR43","doi-asserted-by":"crossref","unstructured":"Behl, A., Jafari, O.H., Mustikovela, S.K., Alhaija, H.A., Rother, C., Geiger, A.: Bounding boxes, segmentations and object coordinates: how important is recognition for 3D scene flow estimation in autonomous driving scenarios? In: CVPR, pp. 2574\u20132583 (2017)","DOI":"10.1109\/ICCV.2017.281"},{"key":"43_CR44","doi-asserted-by":"crossref","unstructured":"Vogel, C., Schindler, K., Roth, S.: Piecewise rigid scene flow. In: 2013 IEEE International Conference on Computer Vision (ICCV), pp. 1377\u20131384. IEEE (2013)","DOI":"10.1109\/ICCV.2013.174"},{"key":"43_CR45","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"757","DOI":"10.1007\/978-3-319-46484-8_46","volume-title":"Computer Vision \u2013 ECCV 2016","author":"Z Lv","year":"2016","unstructured":"Lv, Z., Beall, C., Alcantarilla, P.F., Li, F., Kira, Z., Dellaert, F.: A continuous optimization approach for efficient and accurate scene flow. In: Leibe, B., Matas, J., Sebe, N., Welling, M. (eds.) ECCV 2016. LNCS, vol. 9912, pp. 757\u2013773. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-46484-8_46"},{"key":"43_CR46","doi-asserted-by":"crossref","unstructured":"Mayer, N., et al.: A large dataset to train convolutional networks for disparity, optical flow, and scene flow estimation. In: CVPR (2016)","DOI":"10.1109\/CVPR.2016.438"},{"key":"43_CR47","doi-asserted-by":"crossref","unstructured":"Fragkiadaki, K., Arbelaez, P., Felsen, P., Malik, J.: Learning to segment moving objects in videos. In: CVPR, pp. 4083\u20134090 (2015)","DOI":"10.1109\/CVPR.2015.7299035"},{"key":"43_CR48","doi-asserted-by":"crossref","unstructured":"Yoon, J.S., Rameau, F., Kim, J., Lee, S., Shin, S., Kweon, I.S.: Pixel-level matching for video object segmentation using convolutional neural networks. In: 2017 IEEE International Conference on Computer Vision (ICCV), pp. 2186\u20132195. IEEE (2017)","DOI":"10.1109\/ICCV.2017.238"},{"key":"43_CR49","unstructured":"Tokmakov, P., Schmid, C., Alahari, K.: Learning to segment moving objects. arXiv preprint arXiv:1712.01127 (2017)"},{"issue":"1","key":"43_CR50","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1109\/TPAMI.2017.2662005","volume":"40","author":"W Wang","year":"2018","unstructured":"Wang, W., Shen, J., Yang, R., Porikli, F.: Saliency-aware video object segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 40(1), 20\u201333 (2018)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"43_CR51","doi-asserted-by":"crossref","unstructured":"Faktor, A., Irani, M.: Video segmentation by non-local consensus voting. In: BMVC, vol. 2, p. 8 (2014)","DOI":"10.5244\/C.28.21"},{"key":"43_CR52","doi-asserted-by":"crossref","unstructured":"Yang, Z., Gao, J., Nevatia, R.: Spatio-temporal action detection with cascade proposal and location anticipation. arXiv preprint arXiv:1708.00042 (2017)","DOI":"10.5244\/C.31.95"},{"key":"43_CR53","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"282","DOI":"10.1007\/978-3-642-15555-0_21","volume-title":"Computer Vision \u2013 ECCV 2010","author":"T Brox","year":"2010","unstructured":"Brox, T., Malik, J.: Object segmentation by long term analysis of point trajectories. In: Daniilidis, K., Maragos, P., Paragios, N. (eds.) ECCV 2010. LNCS, vol. 6315, pp. 282\u2013295. Springer, Heidelberg (2010). https:\/\/doi.org\/10.1007\/978-3-642-15555-0_21"},{"key":"43_CR54","doi-asserted-by":"crossref","unstructured":"Kim, K., Yang, Z., Masi, I., Nevatia, R., Medioni, G.: Face and body association for video-based face recognition. In: 2018 IEEE Winter Conference on Applications of Computer Vision (WACV), pp. 39\u201348. IEEE (2018)","DOI":"10.1109\/WACV.2018.00011"},{"key":"43_CR55","doi-asserted-by":"crossref","unstructured":"Ilg, E., Mayer, N., Saikia, T., Keuper, M., Dosovitskiy, A., Brox, T.: FlowNet 2.0: evolution of optical flow estimation with deep networks. In: CVPR (2017)","DOI":"10.1109\/CVPR.2017.179"},{"key":"43_CR56","unstructured":"Jaderberg, M., Simonyan, K., Zisserman, A., et al.: Spatial transformer networks. In: Advances in Neural Information Processing Systems, pp. 2017\u20132025 (2015)"},{"issue":"2","key":"43_CR57","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1007\/BF00129684","volume":"9","author":"C Tomasi","year":"1992","unstructured":"Tomasi, C., Kanade, T.: Shape and motion from image streams under orthography: a factorization method. Int. J. Comput. Vis. 9(2), 137\u2013154 (1992)","journal-title":"Int. J. Comput. Vis."},{"issue":"4","key":"43_CR58","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1109\/TIP.2003.819861","volume":"13","author":"Z Wang","year":"2004","unstructured":"Wang, Z., Bovik, A.C., Sheikh, H.R., Simoncelli, E.P.: Image quality assessment: from error visibility to structural similarity. IEEE Trans. Image Process. 13(4), 600\u2013612 (2004)","journal-title":"IEEE Trans. Image Process."},{"issue":"2","key":"43_CR59","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1023\/B:VISI.0000029664.99615.94","volume":"60","author":"DG Lowe","year":"2004","unstructured":"Lowe, D.G.: Distinctive image features from scale-invariant keypoints. Int. J. Comput. Vis. 60(2), 91\u2013110 (2004)","journal-title":"Int. J. Comput. Vis."},{"key":"43_CR60","doi-asserted-by":"crossref","unstructured":"Lowe, D.G.: Object recognition from local scale-invariant features. In: The Proceedings of the Seventh IEEE International Conference on Computer Vision, vol. 2, pp. 1150\u20131157. IEEE (1999)","DOI":"10.1109\/ICCV.1999.790410"},{"key":"43_CR61","doi-asserted-by":"crossref","unstructured":"Sun, D., Yang, X., Liu, M.Y., Kautz, J.: PWC-Net: CNNs for optical flow using pyramid, warping, and cost volume. arXiv preprint arXiv:1709.02371 (2017)","DOI":"10.1109\/CVPR.2018.00931"},{"key":"43_CR62","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. arXiv:1409.1556 (2014)"},{"key":"43_CR63","unstructured":"Lee, C.Y., Xie, S., Gallagher, P., Zhang, Z., Tu, Z.: Deeply-supervised nets. In: Artificial Intelligence and Statistics, pp. 562\u2013570 (2015)"},{"key":"43_CR64","unstructured":"Ioffe, S., Szegedy, C.: Batch normalization: accelerating deep network training by reducing internal covariate shift. In: ICML (2015)"},{"key":"43_CR65","unstructured":"Kingma, D., Ba, J.: Adam: a method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"},{"key":"43_CR66","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"234","DOI":"10.1007\/978-3-319-24574-4_28","volume-title":"Medical Image Computing and Computer-Assisted Intervention \u2013 MICCAI 2015","author":"O Ronneberger","year":"2015","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-Net: convolutional networks for biomedical image segmentation. In: Navab, N., Hornegger, J., Wells, W.M., Frangi, A.F. (eds.) MICCAI 2015. LNCS, vol. 9351, pp. 234\u2013241. Springer, Cham (2015). https:\/\/doi.org\/10.1007\/978-3-319-24574-4_28"},{"key":"43_CR67","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., Darrell, T.: Fully convolutional networks for semantic segmentation. In: CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"43_CR68","doi-asserted-by":"crossref","unstructured":"Kuznietsov, Y., Stuckler, J., Leibe, B.: Semi-supervised deep learning for monocular depth map prediction (2017)","DOI":"10.1109\/CVPR.2017.238"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2018 Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-11021-5_43","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,22]],"date-time":"2023-01-22T01:21:43Z","timestamp":1674350503000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-11021-5_43"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019]]},"ISBN":["9783030110208","9783030110215"],"references-count":68,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-11021-5_43","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2019]]},"assertion":[{"value":"23 January 2019","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Munich","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Germany","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2018","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 September 2018","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14 September 2018","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"15","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2018","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2018.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}