{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T06:36:51Z","timestamp":1782887811731,"version":"3.54.5"},"reference-count":41,"publisher":"Springer Science and Business Media LLC","issue":"9","license":[{"start":{"date-parts":[[2018,5,12]],"date-time":"2018-05-12T00:00:00Z","timestamp":1526083200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"funder":[{"DOI":"10.13039\/501100000781","name":"European Research Council","doi-asserted-by":"publisher","award":["StG-2013-335373"],"award-info":[{"award-number":["StG-2013-335373"]}],"id":[{"id":"10.13039\/501100000781","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100000266","name":"Engineering and Physical Sciences Research Council","doi-asserted-by":"publisher","award":["EP\/M013685\/1"],"award-info":[{"award-number":["EP\/M013685\/1"]}],"id":[{"id":"10.13039\/501100000266","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2018,9]]},"DOI":"10.1007\/s00371-018-1551-5","type":"journal-article","created":{"date-parts":[[2018,5,12]],"date-time":"2018-05-12T06:08:58Z","timestamp":1526105338000},"page":"1165-1176","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["DepthCut: improved depth edge estimation using multiple unreliable channels"],"prefix":"10.1007","volume":"34","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7568-2849","authenticated-orcid":false,"given":"Paul","family":"Guerrero","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Holger","family":"Winnem\u00f6ller","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Wilmot","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Niloy J.","family":"Mitra","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2018,5,12]]},"reference":[{"key":"1551_CR1","unstructured":"Amer, M.R., Raich, R., Todorovic, S.: Monocular extraction of 2.1d sketch. In: ICIP (2010)"},{"issue":"5","key":"1551_CR2","doi-asserted-by":"publisher","first-page":"898","DOI":"10.1109\/TPAMI.2010.161","volume":"33","author":"P Arbel\u00e1ez","year":"2011","unstructured":"Arbel\u00e1ez, P., Maire, M., Fowlkes, C., Malik, J.: Contour detection and hierarchical image segmentation. IEEE PAMI 33(5), 898\u2013916 (2011)","journal-title":"IEEE PAMI"},{"key":"1551_CR3","unstructured":"Bakry, A., Elhoseiny, M., El-Gaaly, T., Elgammal, A.M.: Digging deep into the layers of cnns (2015). CoRR arXiv:1508.01983"},{"key":"1551_CR4","doi-asserted-by":"crossref","unstructured":"Bansal, A., Kowdle, A., Parikh, D., Gallagher, A., Zitnick, L.: Which edges matter? In: IEEE ICCV (2013)","DOI":"10.1109\/ICCVW.2013.80"},{"key":"1551_CR5","doi-asserted-by":"crossref","unstructured":"Boulch, A., Marlet, R.: Deep learning for robust normal estimation in unstructured point clouds. In: SGP (2016)","DOI":"10.1111\/cgf.12983"},{"key":"1551_CR6","unstructured":"Chakrabarti, A., Shao, J., Shakhnarovich, G.: Depth from a single image by harmonizing overcomplete local network predictions. In: NIPS, pp. 2658\u20132666 (2016)"},{"key":"1551_CR7","doi-asserted-by":"publisher","first-page":"42","DOI":"10.1016\/j.cviu.2012.10.001","volume":"117","author":"X Chen","year":"2013","unstructured":"Chen, X., Li, Q., Zhao, D., Zhao, Q.: Occlusion cues for image scene layering. Comput. Vis. Image Underst. 117, 42\u201355 (2013)","journal-title":"Comput. Vis. Image Underst."},{"key":"1551_CR8","unstructured":"Couprie, C., Farabet, C., Najman, L., LeCun, Y.: Indoor semantic segmentation using depth information (2013). CoRR arXiv:1301.3572"},{"issue":"12","key":"1551_CR9","doi-asserted-by":"publisher","first-page":"1181","DOI":"10.1007\/s00371-011-0667-7","volume":"28","author":"MJ Dahan","year":"2012","unstructured":"Dahan, M.J., Chen, N., Shamir, A., Cohen-Or, D.: Combining color and depth for enhanced image segmentation and retargeting. TVCJ 28(12), 1181\u20131193 (2012)","journal-title":"TVCJ"},{"key":"1551_CR10","unstructured":"Eigen, D., Fergus, R.: Predicting depth, surface normals and semantic labels with a common multi-scale convolutional architecture (2014). CoRR arXiv:1411.4734"},{"issue":"6","key":"1551_CR11","doi-asserted-by":"publisher","first-page":"135:1","DOI":"10.1145\/2366145.2366154","volume":"31","author":"M Fisher","year":"2012","unstructured":"Fisher, M., Ritchie, D., Savva, M., Funkhouser, T., Hanrahan, P.: Example-based synthesis of 3d object arrangements. ACM TOG 31(6), 135:1\u2013135:11 (2012)","journal-title":"ACM TOG"},{"key":"1551_CR12","volume-title":"The Ecological Approach to Visual Perception","author":"JJ Gibson","year":"1986","unstructured":"Gibson, J.J.: The Ecological Approach to Visual Perception. Routledge, Abingdon (1986)"},{"key":"1551_CR13","doi-asserted-by":"crossref","unstructured":"Gupta, S., Girshick, R.B., Arbel\u00e1ez, P.A., Malik, J.: Learning rich features from rgb-d images for object detection and segmentation. In: ECCV (2014)","DOI":"10.1007\/978-3-319-10584-0_23"},{"key":"1551_CR14","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Delving deep into rectifiers: surpassing human-level performance on imagenet classification. In: IEEE ICCV, pp. 1026\u20131034 (2015)","DOI":"10.1109\/ICCV.2015.123"},{"issue":"5786","key":"1551_CR15","doi-asserted-by":"publisher","first-page":"504","DOI":"10.1126\/science.1127647","volume":"313","author":"GE Hinton","year":"2006","unstructured":"Hinton, G.E., Salakhutdinov, R.R.: Reducing the dimensionality of data with neural networks. Science 313(5786), 504\u2013507 (2006)","journal-title":"Science"},{"key":"1551_CR16","doi-asserted-by":"crossref","unstructured":"Iizuka, S., Endo, Y., Kanamori, Y., Mitani, J., Fukui, Y.: Efficient depth propagation for constructing a layered depth image from a single image. In: CGF, vol. 33, No. 7 (2014)","DOI":"10.1111\/cgf.12496"},{"key":"1551_CR17","unstructured":"Ioffe, S., Szegedy, C.: Batch normalization: accelerating deep network training by reducing internal covariate shift. In: ICML, pp. 448\u2013456 (2015)"},{"key":"1551_CR18","unstructured":"Isola, P., Zhu, J.Y., Zhou, T., Efros, A.A.: Image-to-image translation with conditional adversarial networks (2016). CoRR arXiv:1611.07004"},{"key":"1551_CR19","unstructured":"Kingma, D.P., Ba, J.: Adam: A method for stochastic optimization. In: ICLR (2015)"},{"key":"1551_CR20","doi-asserted-by":"crossref","unstructured":"Kolmogorov, V., Criminisi, A., Blake, A., Cross, G., Rother, C.: Bi-layer segmentation of binocular stereo video. In: IEEE CVPR, vol. 2, pp. 407\u2013414 (2005)","DOI":"10.1109\/CVPR.2005.91"},{"key":"1551_CR21","unstructured":"Krizhevsky, A., Sutskever, I., Hinton, G.E.: Imagenet classification with deep convolutional neural networks. In: NIPS, pp. 1097\u20131105 (2012)"},{"issue":"5","key":"1551_CR22","doi-asserted-by":"publisher","first-page":"530","DOI":"10.1109\/TPAMI.2004.1273918","volume":"26","author":"DR Martin","year":"2004","unstructured":"Martin, D.R., Fowlkes, C.C., Malik, J.: Learning to detect natural image boundaries using local brightness, color, and texture cues. IEEE PAMI 26(5), 530\u2013549 (2004)","journal-title":"IEEE PAMI"},{"key":"1551_CR23","doi-asserted-by":"crossref","unstructured":"Mayer, N., Ilg, E., Hausser, P., Fischer, P., Cremers, D., Dosovitskiy, A., Brox, T.: A large dataset to train convolutional networks for disparity, optical flow, and scene flow estimation. In: IEEE CVPR, pp. 4040\u20134048 (2016)","DOI":"10.1109\/CVPR.2016.438"},{"issue":"3","key":"1551_CR24","doi-asserted-by":"publisher","first-page":"84:1","DOI":"10.1145\/1531326.1531390","volume":"28","author":"J McCann","year":"2009","unstructured":"McCann, J., Pollard, N.: Local layering. ACM TOG 28(3), 84:1\u201384:7 (2009)","journal-title":"ACM TOG"},{"key":"1551_CR25","unstructured":"McCormac, J., Handa, A., Leutenegger, S., Davison, A.J.: Scenenet RGB-D: 5m photorealistic images of synthetic indoor trajectories with ground truth (2016). CoRR arXiv:1612.05079"},{"key":"1551_CR26","doi-asserted-by":"crossref","unstructured":"Mitra, N.J., Wand, M., Zhang, H., Cohen-Or, D., Kim, V., Huang, Q.X.: Structure-aware shape processing. In: ACM SIGGRAPH 2014 Courses, pp. 13:1\u201313:21 (2014)","DOI":"10.1145\/2614028.2615401"},{"key":"1551_CR27","doi-asserted-by":"crossref","unstructured":"Nitzberg, M., Mumford, D.: The 2.1-d sketch. In: IEEE ICCV, pp. 138\u2013144 (1990)","DOI":"10.1109\/ICCV.1990.139511"},{"key":"1551_CR28","unstructured":"Ren, X., Bo, L.: Discriminatively trained sparse code gradients for contour detection. In: NIPS (2012)"},{"key":"1551_CR29","doi-asserted-by":"crossref","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-Net: convolutional networks for biomedical image segmentation. In: MICCAI, pp. 234\u2013241 (2015)","DOI":"10.1007\/978-3-319-24574-4_28"},{"issue":"3","key":"1551_CR30","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1145\/1015706.1015720","volume":"23","author":"C Rother","year":"2004","unstructured":"Rother, C., Kolmogorov, V., Blake, A.: grabcut: interactive foreground extraction using iterated graph cuts. ACM TOG 23(3), 309\u2013314 (2004)","journal-title":"ACM TOG"},{"key":"1551_CR31","doi-asserted-by":"crossref","unstructured":"Scharstein, D., Hirschmller, H., Kitajima, Y., Krathwohl, G., Nesic, N., Wang, X., Westling, P.: High-resolution stereo datasets with subpixel-accurate ground truth. In: GCPR, Lecture Notes in Computer Science, vol. 8753, pp. 31\u201342. Springer, Berlin (2014)","DOI":"10.1007\/978-3-319-11752-2_3"},{"key":"1551_CR32","unstructured":"Sermanet, P., Eigen, D., Zhang, X., Mathieu, M., Fergus, R., LeCun, Y.: OverFeat: integrated recognition, localization and detection using convolutional networks (2013). CoRR arXiv:1312.6229"},{"key":"1551_CR33","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition. In: ICLR (2015)"},{"key":"1551_CR34","doi-asserted-by":"crossref","unstructured":"Song, S., Yu, F., Zeng, A., Chang, A.X., Savva, M., Funkhouser, T.: Semantic scene completion from a single depth image. In: IEEE CVPR (2017)","DOI":"10.1109\/CVPR.2017.28"},{"key":"1551_CR35","doi-asserted-by":"crossref","unstructured":"Sundberg, P., Brox, T., Maire, M., Arbelaez, P., Malik, J.: Occlusion boundary detection and figure\/ground assignment from optical flow. In: IEEE CVPR (2011)","DOI":"10.1109\/CVPR.2011.5995364"},{"key":"1551_CR36","unstructured":"Szegedy, C., Toshev, A., Erhan, D.: Deep neural networks for object detection. In: NIPS (2013)"},{"key":"1551_CR37","doi-asserted-by":"crossref","unstructured":"Toshev, A., Szegedy, C.: Deeppose: human pose estimation via deep neural networks. In: IEEE CVPR (2014)","DOI":"10.1109\/CVPR.2014.214"},{"key":"1551_CR38","doi-asserted-by":"crossref","unstructured":"Xu, K., Kim, V.G., Huang, Q., Mitra, N., Kalogerakis, E.: Data-driven shape analysis and processing. In: SIGGRAPH ASIA 2016 Courses, pp. 4:1\u20134:38 (2016)","DOI":"10.1145\/2988458.2988473"},{"issue":"5","key":"1551_CR39","doi-asserted-by":"publisher","first-page":"507","DOI":"10.1016\/j.gmod.2014.03.015","volume":"76","author":"CC Yu","year":"2014","unstructured":"Yu, C.C., Liu, Y.J., Wu, M.T., Li, K.Y., Fu, X.: A global energy optimization framework for 2.1d sketch extraction from monocular images. Graph. Models 76(5), 507\u2013521 (2014). Geometric Modeling and Processing 2014","journal-title":"Graph. Models"},{"issue":"1","key":"1551_CR40","first-page":"2287","volume":"17","author":"J \u017dbontar","year":"2016","unstructured":"\u017dbontar, J., LeCun, Y.: Stereo matching by training a convolutional neural network to compare image patches. J. Mach. Learn. Res. 17(1), 2287\u20132318 (2016)","journal-title":"J. Mach. Learn. Res."},{"key":"1551_CR41","doi-asserted-by":"crossref","unstructured":"Zhu, H., Weibel, J.B., Lu, S.: Discriminative multi-modal feature fusion for rgbd indoor scene recognition. In: IEEE CVPR (2016)","DOI":"10.1109\/CVPR.2016.324"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00371-018-1551-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-018-1551-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-018-1551-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,4]],"date-time":"2025-07-04T13:17:34Z","timestamp":1751635054000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00371-018-1551-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,5,12]]},"references-count":41,"journal-issue":{"issue":"9","published-print":{"date-parts":[[2018,9]]}},"alternative-id":["1551"],"URL":"https:\/\/doi.org\/10.1007\/s00371-018-1551-5","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,5,12]]},"assertion":[{"value":"12 May 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance with ethical standards"}},{"value":"The authors declare that they have no conflicts of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}