{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,8]],"date-time":"2026-04-08T16:23:40Z","timestamp":1775665420573,"version":"3.50.1"},"reference-count":61,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,6,1]],"date-time":"2021-06-01T00:00:00Z","timestamp":1622505600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,6,1]],"date-time":"2021-06-01T00:00:00Z","timestamp":1622505600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,6]]},"DOI":"10.1109\/cvprw53098.2021.00054","type":"proceedings-article","created":{"date-parts":[[2021,9,1]],"date-time":"2021-09-01T20:57:37Z","timestamp":1630529857000},"page":"433-442","source":"Crossref","is-referenced-by-count":149,"title":["Perceptual Image Quality Assessment with Transformers"],"prefix":"10.1109","author":[{"given":"Manri","family":"Cheon","sequence":"first","affiliation":[{"name":"LG Electronics,Seoul,Korea"}]},{"given":"Sung-Jun","family":"Yoon","sequence":"additional","affiliation":[{"name":"LG Electronics,Seoul,Korea"}]},{"given":"Byungyeon","family":"Kang","sequence":"additional","affiliation":[{"name":"LG Electronics,Seoul,Korea"}]},{"given":"Junwoo","family":"Lee","sequence":"additional","affiliation":[{"name":"LG Electronics,Seoul,Korea"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00194"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1016\/j.image.2014.10.009"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/QoMEX.2019.8743252"},{"key":"ref32","doi-asserted-by":"crossref","first-page":"11006","DOI":"10.1117\/1.3267105","article-title":"Most apparent distortion: full-reference image quality assessment and the role of strategy","volume":"19","author":"larson","year":"2010","journal-title":"Journal of Electronic Imaging"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.2352\/ISSN.2470-1173.2016.16.HVEI-103"},{"key":"ref30","article-title":"Colorization transformer","author":"kumar","year":"2021"},{"key":"ref37","first-page":"4055","article-title":"Image transformer","author":"parmar","year":"2018","journal-title":"Int Conf Mach Learn"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2012.2227726"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2016.12.009"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2011.2175935"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2010.5649275"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00068"},{"key":"ref28","article-title":"Adam: A method for stochastic optimization","author":"kingma","year":"2015","journal-title":"Int Conf Learn Represent"},{"key":"ref27","article-title":"Transformers in vision: A survey","author":"khan","year":"2021"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/QoMEX.2016.7498936"},{"key":"ref2","first-page":"1","article-title":"The 2018 PIRM challenge on perceptual image super-resolution","author":"blau","year":"2018","journal-title":"Eur Conf Comput Vis Workshop"},{"key":"ref1","article-title":"Layer normalization","author":"ba","year":"2016"},{"key":"ref20","first-page":"2672","article-title":"Generative adversarial nets","author":"goodfellow","year":"2014","journal-title":"Adv Neural Inform Process Syst"},{"key":"ref22","first-page":"633","article-title":"PIPAL: A large-scale image quality assessment dataset for perceptual image restoration","author":"gu","year":"2020","journal-title":"Eur Conf Comput Vis"},{"key":"ref21","article-title":"Image quality assessment for perceptual image restoration: A new dataset, benchmark and metric","author":"gu","year":"2020"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2020.2967829"},{"key":"ref23","article-title":"NTIRE 2021 challenge on perceptual image quality assessment","author":"gu","year":"2021","journal-title":"IEEE\/CVF Conf Comput Vis Pattern Recog Worksh"},{"key":"ref26","article-title":"Transgan: Two transformers can make one strong gan","author":"jiang","year":"2021"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1016\/j.image.2020.115839"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/97.995823"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2003.819861"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2011.2109730"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2014.2346028"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2012.6467149"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1007\/s11432-019-2757-1"},{"key":"ref55","article-title":"Transformer for image quality assessment","author":"you","year":"2020"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00583"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2013.2293423"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/ACSSC.2003.1292216"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1016\/j.image.2021.116150"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TBC.2011.2104671"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2005.859378"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2019.06.103"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/83.841940"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref15","article-title":"Bert: Pre-training of deep bidirectional trans-formers for language understanding","author":"devlin","year":"2018"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3045810"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-020-01419-7"},{"key":"ref18","article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","author":"dosovitskiy","year":"2020"},{"key":"ref19","first-page":"3677","article-title":"Perceptual quality assessment of smartphone photography","author":"fang","year":"2020","journal-title":"IEEE Conf Comput Vis Pattern Recog"},{"key":"ref4","first-page":"213","article-title":"End-to-end object detection with transformers","author":"carion","year":"2020","journal-title":"Eur Conf Comput Vis"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2017.2760518"},{"key":"ref6","article-title":"Pre-trained image processing transformer","author":"chen","year":"2020"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2007.901820"},{"key":"ref8","first-page":"1","article-title":"Generative adversarial network-based image super-resolution using perceptual content losses","author":"cheon","year":"2018","journal-title":"Eur Conf Comput Vis Workshop"},{"key":"ref7","first-page":"1691","article-title":"Generative pretraining from pixels","author":"chen","year":"2020","journal-title":"Int Conf Mach Learn"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2011.942295"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2017.2683504"},{"key":"ref46","article-title":"Attention is all you need","author":"vaswani","year":"2017"},{"key":"ref45","article-title":"Training data-efficient image trans-formers & distillation through attention","author":"touvron","year":"2020"},{"key":"ref48","first-page":"1","article-title":"ESRGAN: Enhanced super-resolution generative adversarial networks","author":"wang","year":"2018","journal-title":"Eur Conf Comput Vis Workshop"},{"key":"ref47","first-page":"108","article-title":"Axial-deeplab: Stand-alone axial-attention for panoptic segmentation","author":"wang","year":"2020","journal-title":"Eur Conf Comput Vis"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2006.881959"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2005.859389"},{"key":"ref44","first-page":"1","article-title":"Inception-v4, inceptionresnet and the impact of residual connections on learning","author":"szegedy","year":"2017","journal-title":"AAAI"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2011.2166082"}],"event":{"name":"2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)","location":"Nashville, TN, USA","start":{"date-parts":[[2021,6,19]]},"end":{"date-parts":[[2021,6,25]]}},"container-title":["2021 IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops (CVPRW)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9522011\/9522684\/09523022.pdf?arnumber=9523022","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,8,2]],"date-time":"2022-08-02T23:53:23Z","timestamp":1659484403000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9523022\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,6]]},"references-count":61,"URL":"https:\/\/doi.org\/10.1109\/cvprw53098.2021.00054","relation":{},"subject":[],"published":{"date-parts":[[2021,6]]}}}