{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,15]],"date-time":"2026-04-15T21:48:25Z","timestamp":1776289705115,"version":"3.50.1"},"reference-count":40,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"6","license":[{"start":{"date-parts":[[2017,6,1]],"date-time":"2017-06-01T00:00:00Z","timestamp":1496275200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2017,6,1]],"date-time":"2017-06-01T00:00:00Z","timestamp":1496275200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2017,6,1]],"date-time":"2017-06-01T00:00:00Z","timestamp":1496275200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100006112","name":"Microsoft Research","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100006112","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Pattern Anal. Mach. Intell."],"published-print":{"date-parts":[[2017,6,1]]},"DOI":"10.1109\/tpami.2016.2577031","type":"journal-article","created":{"date-parts":[[2016,6,6]],"date-time":"2016-06-06T14:07:41Z","timestamp":1465222061000},"page":"1137-1149","source":"Crossref","is-referenced-by-count":32324,"title":["Faster R-CNN: Towards Real-Time Object Detection with Region Proposal Networks"],"prefix":"10.1109","volume":"39","author":[{"given":"Shaoqing","family":"Ren","sequence":"first","affiliation":[{"name":"University of Science and Technology of China, Hefei, Anhui, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7318-9658","authenticated-orcid":false,"given":"Kaiming","family":"He","sequence":"additional","affiliation":[{"name":"Visual Computing Group, Microsoft Research, Beijing, China"}]},{"given":"Ross","family":"Girshick","sequence":"additional","affiliation":[{"name":"Facebook AI Research, Seattle, WA 98109"}]},{"given":"Jian","family":"Sun","sequence":"additional","affiliation":[{"name":"Visual Computing Group, Microsoft Research, Beijing, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10578-9_23"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.169"},{"key":"ref3","article-title":"Very deep convolutional networks for large-scale image recognition","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Simonyan","year":"2015"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-013-0620-5"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_26"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2009.167"},{"key":"ref9","article-title":"Overfeat: Integrated recognition, localization and detection using convolutional networks","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Sermanet","year":"2014"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2016.2577031"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-009-0275-4"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"ref13","article-title":"Deep sliding shapes for amodal 3d object detection in RGB-D images","author":"Song","year":"2015","journal-title":"arXiv:1511.02300"},{"key":"ref14","article-title":"DeePM: A deep part-based model for object detection and semantic part localization","author":"Zhu","year":"2015","journal-title":"arXiv:1511.07131"},{"key":"ref15","article-title":"Instance-aware semantic segmentation via multi-task network cascades","author":"Dai","year":"2015","journal-title":"arXiv:1512.04412"},{"key":"ref16","article-title":"Densecap: Fully convolutional localization networks for dense captioning","author":"Johnson","year":"2015","journal-title":"arXiv:1511.07571"},{"key":"ref17","article-title":"Human curation and convnets: Powering item-to-item recommendations on pinterest","author":"Kislyuk","year":"2015","journal-title":"arXiv:1511.04003"},{"key":"ref18","article-title":"Deep residual learning for image recognition","author":"He","year":"2015","journal-title":"arXiv:1512.03385"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.5244\/C.28.24"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2465908"},{"key":"ref21","article-title":"Object-proposal evaluation protocol is \u2019gameable\u2019","author":"Chavali","year":"2015","journal-title":"arXiv: 1505.05836"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2011.231"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.49"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2012.28"},{"key":"ref25","article-title":"Deep neural networks for object detection","volume-title":"Proc. Neural Inform. Process. Syst.","author":"Szegedy","year":"2013"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.276"},{"key":"ref27","article-title":"Scalable, high-quality object detection","author":"Szegedy","year":"2015","journal-title":"arXiv:1412.1441 (v1)"},{"key":"ref28","first-page":"1981","article-title":"Learning to segment object candidates","volume-title":"Proc. Adv. Neural Inform. Process. Syst.","author":"Pinheiro","year":"2015"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7299025"},{"key":"ref30","article-title":"Object detection networks on convolutional feature maps","author":"Ren","year":"2015","journal-title":"arXiv:1504.06066"},{"key":"ref31","first-page":"577","article-title":"Attention-based models for speech recognition","volume-title":"Proc. Adv. Neural Inform. Process. Syst.","author":"Chorowski","year":"2015"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10590-1_53"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.5555\/3104322.3104425"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.4324\/9781410605337-29"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1989.1.4.541"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref37","article-title":"Imagenet classification with deep convolutional neural networks","volume-title":"Proc. Neural Inf. Process. Syst.","author":"Krizhevsky","year":"2012"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2654889"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.5244\/C.29.5"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33712-3_25"}],"container-title":["IEEE Transactions on Pattern Analysis and Machine Intelligence"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/34\/7919342\/07485869.pdf?arnumber=7485869","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,13]],"date-time":"2025-08-13T05:54:48Z","timestamp":1755064488000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/7485869\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,6,1]]},"references-count":40,"journal-issue":{"issue":"6"},"URL":"https:\/\/doi.org\/10.1109\/tpami.2016.2577031","relation":{},"ISSN":["0162-8828","2160-9292","1939-3539"],"issn-type":[{"value":"0162-8828","type":"print"},{"value":"2160-9292","type":"electronic"},{"value":"1939-3539","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017,6,1]]}}}