{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,12]],"date-time":"2026-02-12T17:44:07Z","timestamp":1770918247765,"version":"3.50.1"},"reference-count":52,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"name":"ICT Research and Development Program of MSIP\/IITP"},{"name":"Korea Government (MSIT) through the Artificial Intelligence Graduate School Program of Chung-Ang University","award":["2021-0-01341"],"award-info":[{"award-number":["2021-0-01341"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2022]]},"DOI":"10.1109\/access.2022.3166928","type":"journal-article","created":{"date-parts":[[2022,4,12]],"date-time":"2022-04-12T19:33:04Z","timestamp":1649791984000},"page":"38742-38749","source":"Crossref","is-referenced-by-count":18,"title":["Pyramid Attention Upsampling Module for Object Detection"],"prefix":"10.1109","volume":"10","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4773-2914","authenticated-orcid":false,"given":"Hyeokjin","family":"Park","sequence":"first","affiliation":[{"name":"Department of Image, Chung-Ang University, Seoul, South Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8593-7155","authenticated-orcid":false,"given":"Joonki","family":"Paik","sequence":"additional","affiliation":[{"name":"Department of Image, Chung-Ang University, Seoul, South Korea"}]}],"member":"263","reference":[{"key":"ref1","article-title":"TinaFace: Strong but simple baseline for face 
detection","author":"Zhu","year":"2020","journal-title":"arXiv:2011.13183"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00525"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2018.2859831"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2018.2846405"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01117"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2929949"},{"key":"ref7","first-page":"1097","article-title":"ImageNet classification with deep convolutional neural networks","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"25","author":"Krizhevsky"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00716"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.195"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.634"},{"issue":"6","key":"ref14","first-page":"33","article-title":"Pyramid methods in image processing","volume":"29","author":"Adelson","year":"1984","journal-title":"RCA Eng."},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.106"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00913"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00720"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00442"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01228-1_15"},{"key":"ref21","article-title":"DSSD: Deconvolutional single shot 
detector","author":"Fu","year":"2017","journal-title":"arXiv:1701.06659"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2018.00125"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.660"},{"key":"ref24","article-title":"Rethinking atrous convolution for semantic image segmentation","author":"Chen","year":"2017","journal-title":"arXiv:1706.05587"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00953"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.169"},{"key":"ref28","first-page":"91","article-title":"Faster R-CNN: Towards real-time object detection with region proposal networks","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"28","author":"Ren"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00644"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00091"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.91"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00667"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01264-9_45"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00978"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00972"},{"key":"ref39","first-page":"5998","article-title":"Attention is all you need","volume-title":"Proc. Adv. Neural Inf. Process. 
Syst.","author":"Vaswani"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref42","first-page":"10347","article-title":"Training data-efficient image transformers & distillation through attention","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Touvron"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01009"},{"key":"ref44","article-title":"An image is worth $16\\times16$ words: Transformers for image recognition at scale","author":"Dosovitskiy","year":"2020","journal-title":"arXiv:2010.11929"},{"key":"ref45","first-page":"1691","article-title":"Generative pretraining from pixels","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Chen"},{"key":"ref46","first-page":"4055","article-title":"Image transformer","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Parmar"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.39"},{"key":"ref48","article-title":"Pyramid attention network for semantic segmentation","author":"Li","year":"2018","journal-title":"arXiv:1805.10180"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-018-1101-7"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2018.2865280"},{"key":"ref51","article-title":"Deformable DETR: Deformable transformers for end-to-end object detection","author":"Zhu","year":"2020","journal-title":"arXiv:2010.04159"},{"key":"ref52","article-title":"MMDetection: Open MMLab detection toolbox and benchmark","author":"Chen","year":"2019","journal-title":"arXiv:1906.07155"}],"container-title":["IEEE 
Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6287639\/9668973\/09756022.pdf?arnumber=9756022","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,22]],"date-time":"2024-01-22T21:08:46Z","timestamp":1705957726000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9756022\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"references-count":52,"URL":"https:\/\/doi.org\/10.1109\/access.2022.3166928","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022]]}}}