{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,29]],"date-time":"2025-09-29T08:27:14Z","timestamp":1759134434017},"reference-count":29,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,10]]},"DOI":"10.1109\/iros.2018.8593736","type":"proceedings-article","created":{"date-parts":[[2019,1,24]],"date-time":"2019-01-24T02:33:30Z","timestamp":1548297210000},"page":"355-361","source":"Crossref","is-referenced-by-count":7,"title":["In pixels we trust: From Pixel Labeling to Object Localization and Scene Categorization"],"prefix":"10.1109","author":[{"given":"Carlos","family":"Herranz-Perdiguero","sequence":"first","affiliation":[]},{"given":"Carolina","family":"Redondo-Cabrera","sequence":"additional","affiliation":[]},{"given":"Roberto J.","family":"Lopez-Sastre","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"doi-asserted-by":"publisher","key":"ref10","DOI":"10.1109\/CVPR.2017.660"},{"doi-asserted-by":"publisher","key":"ref11","DOI":"10.1109\/CVPR.2016.645"},{"key":"ref12","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2015","journal-title":"International Conference on Learning Representations"},{"key":"ref13","doi-asserted-by":"crossref","DOI":"10.1609\/aaai.v31i1.11226","article-title":"Depth CNNs for RGB-D scene recognition: Learning from scratch better than transferring from RGB-CNNs","author":"song","year":"2017","journal-title":"AAAI"},{"key":"ref14","article-title":"SSD: Single shot multibox detector","author":"liu","year":"2016","journal-title":"ECCV"},{"doi-asserted-by":"publisher","key":"ref15","DOI":"10.1109\/CVPR.2009.5206718"},{"key":"ref16","article-title":"Describing the scene as a whole: Joint object detection, scene classification and semantic segmentation","author":"yao","year":"2012","journal-title":"CVPR"},{"doi-asserted-by":"publisher","key":"ref17","DOI":"10.1109\/CVPR.2013.79"},{"doi-asserted-by":"publisher","key":"ref18","DOI":"10.1007\/s11263-014-0777-6"},{"key":"ref19","article-title":"Learning rich features from RGB-D images for object detection and segmentation","author":"gupta","year":"2014","journal-title":"ECCV"},{"doi-asserted-by":"publisher","key":"ref28","DOI":"10.1109\/TPAMI.2017.2708714"},{"year":"2016","author":"chen","journal-title":"Deeplab Semantic image segmentation with deep convolutional nets atrous convolution and fully connected crfs","key":"ref4"},{"key":"ref27","article-title":"FuseNet: Incorporating depth into semantic segmentation via fusion-based CNN architecture","author":"hazirbas","year":"2016","journal-title":"Asian Conference on Computer Vision (ACCV)"},{"doi-asserted-by":"publisher","key":"ref3","DOI":"10.1109\/IROS.2017.8206470"},{"doi-asserted-by":"publisher","key":"ref6","DOI":"10.1109\/CVPR.2010.5539970"},{"key":"ref29","article-title":"RGB-D scene labeling: Features and algorithms","author":"ren","year":"2012","journal-title":"CVPR"},{"doi-asserted-by":"publisher","key":"ref5","DOI":"10.1109\/CVPR.2017.690"},{"doi-asserted-by":"publisher","key":"ref8","DOI":"10.1109\/CVPR.2016.90"},{"doi-asserted-by":"publisher","key":"ref7","DOI":"10.1109\/ROBOT.2010.5509682"},{"doi-asserted-by":"publisher","key":"ref2","DOI":"10.1109\/IROS.2017.8202213"},{"key":"ref9","article-title":"Indoor segmentation and support inference from RGBD images","author":"silberman","year":"2012","journal-title":"ECCV"},{"doi-asserted-by":"publisher","key":"ref1","DOI":"10.1109\/IROS.2017.8206396"},{"doi-asserted-by":"publisher","key":"ref20","DOI":"10.1109\/CVPR.2014.81"},{"doi-asserted-by":"publisher","key":"ref22","DOI":"10.1109\/TPAMI.2011.153"},{"doi-asserted-by":"publisher","key":"ref21","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"ref24","article-title":"Microsoft COCO: Common objects in context","author":"lin","year":"2014","journal-title":"ECCV"},{"year":"2014","author":"jia","journal-title":"Caffe Convolutional Architecture for Fast Feature Embedding","key":"ref23"},{"key":"ref26","article-title":"Predicting depth, surface normals and semantic labels with a common multi-scale convolutional architecture","author":"eigen","year":"2014","journal-title":"ICCV"},{"year":"0","author":"everingham","journal-title":"The PASCAL Visual Object Classes Challenge 2012 (VOC2012) Results","key":"ref25"}],"event":{"name":"2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)","start":{"date-parts":[[2018,10,1]]},"location":"Madrid","end":{"date-parts":[[2018,10,5]]}},"container-title":["2018 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8574473\/8593358\/08593736.pdf?arnumber=8593736","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,9,10]],"date-time":"2022-09-10T21:04:05Z","timestamp":1662843845000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8593736\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,10]]},"references-count":29,"URL":"https:\/\/doi.org\/10.1109\/iros.2018.8593736","relation":{},"subject":[],"published":{"date-parts":[[2018,10]]}}}