{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T06:10:58Z","timestamp":1760854258953,"version":"3.37.3"},"reference-count":38,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,5,30]],"date-time":"2021-05-30T00:00:00Z","timestamp":1622332800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,5,30]]},"DOI":"10.1109\/icra48506.2021.9561820","type":"proceedings-article","created":{"date-parts":[[2021,10,20]],"date-time":"2021-10-20T00:28:35Z","timestamp":1634689715000},"page":"5126-5132","source":"Crossref","is-referenced-by-count":6,"title":["MonStereo: When Monocular and Stereo Meet at the Tail of 3D Human Localization"],"prefix":"10.1109","author":[{"given":"Lorenzo","family":"Bertoni","sequence":"first","affiliation":[{"name":"EPFL,Visual Intelligence for Transportation (VITA) lab,Switzerland"}]},{"given":"Sven","family":"Kreiss","sequence":"additional","affiliation":[{"name":"EPFL,Visual Intelligence for Transportation (VITA) lab,Switzerland"}]},{"given":"Taylor","family":"Mordan","sequence":"additional","affiliation":[{"name":"EPFL,Visual Intelligence for Transportation (VITA) lab,Switzerland"}]},{"given":"Alexandre","family":"Alahi","sequence":"additional","affiliation":[{"name":"EPFL,Visual Intelligence for Transportation (VITA) lab,Switzerland"}]}],"member":"263","reference":[{"key":"ref38","first-page":"5574","article-title":"What uncertainties do we need in bayesian deep learning for computer vision?","author":"kendall","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00227"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.236"},{"key":"ref31","first-page":"1929","article-title":"Dropout: a simple way to prevent neural networks from overfitting","volume":"15","author":"srivastava","year":"2014","journal-title":"The Journal of Machine Learning Research"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298800"},{"article-title":"Adam: A method for stochastic optimization","year":"2014","author":"kingma","key":"ref36"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.133"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1016\/j.trc.2021.103067"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989311"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W18-5446"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00102"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2018.8594049"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2008.4587671"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01225"},{"article-title":"OpenPifPaf: Composite Fields for Semantic Keypoint Detection and Spatio-Temporal Association","year":"2021","author":"kreiss","key":"ref16"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.597"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33018851"},{"key":"ref19","article-title":"Orthographic feature transform for monocular 3d object detection","author":"roddick","year":"2019","journal-title":"The British Machine Vision Conference (BMVC)"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1136\/adc.73.1.17"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9197069"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00592"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00696"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1177\/0278364913491297"},{"article-title":"Batch normalization: Accelerating deep network training by reducing internal covariate shift","year":"2015","author":"ioffe","key":"ref29"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00864"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2008.4712104"},{"key":"ref7","article-title":"Object detection and matching with mobile cameras collaborating with fixed cameras","author":"alahi","year":"2008","journal-title":"Workshop on Multi-camera and Multi-modal Sensor Fusion Algorithms and Applications-M2SFA2 2008"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01214"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/PETS-WINTER.2009.5399487"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-12-809276-7.00007-2"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00111"},{"key":"ref22","first-page":"424","article-title":"3d object proposals for accurate object class detection","author":"chen","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00208"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00783"},{"key":"ref23","first-page":"646","article-title":"Stereo vision-based semantic 3d object and ego-motion tracking for autonomous driving","author":"li","year":"2018","journal-title":"the European Conference on Computer Vision (ECCV)"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9196660"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00780"}],"event":{"name":"2021 IEEE International Conference on Robotics and Automation (ICRA)","start":{"date-parts":[[2021,5,30]]},"location":"Xi'an, China","end":{"date-parts":[[2021,6,5]]}},"container-title":["2021 IEEE International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9560720\/9560666\/09561820.pdf?arnumber=9561820","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,2]],"date-time":"2022-08-02T23:20:44Z","timestamp":1659482444000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9561820\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,5,30]]},"references-count":38,"URL":"https:\/\/doi.org\/10.1109\/icra48506.2021.9561820","relation":{},"subject":[],"published":{"date-parts":[[2021,5,30]]}}}