{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,24]],"date-time":"2026-02-24T19:08:28Z","timestamp":1771960108623,"version":"3.50.1"},"reference-count":122,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"DOI":"10.13039\/501100004832","name":"Khalifa University of Science and Technology","doi-asserted-by":"publisher","award":["CIRA-2021-085"],"award-info":[{"award-number":["CIRA-2021-085"]}],"id":[{"id":"10.13039\/501100004832","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004832","name":"Khalifa University of Science and Technology","doi-asserted-by":"publisher","award":["FSU-2021-019"],"award-info":[{"award-number":["FSU-2021-019"]}],"id":[{"id":"10.13039\/501100004832","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004832","name":"Khalifa University of Science and Technology","doi-asserted-by":"publisher","award":["RC1-2018-KUCARS"],"award-info":[{"award-number":["RC1-2018-KUCARS"]}],"id":[{"id":"10.13039\/501100004832","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Research Start-Up Grant at United Arab Emirates University, United Arab Emirates","award":["G00004613"],"award-info":[{"award-number":["G00004613"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2024]]},"DOI":"10.1109\/access.2024.3506273","type":"journal-article","created":{"date-parts":[[2024,11,25]],"date-time":"2024-11-25T18:49:07Z","timestamp":1732560547000},"page":"183369-183393","source":"Crossref","is-referenced-by-count":18,"title":["IQA Vision Transformed: A Survey of Transformer Architectures in Perceptual Image Quality Assessment"],"prefix":"10.1109","volume":"12","author":[{"given":"Mobeen Ur","family":"Rehman","sequence":"first","affiliation":[{"name":"Khalifa University Center for Autonomous Robotic Systems (KUCARS), Khalifa University, Abu Dhabi, United Arab Emirates"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2693-4085","authenticated-orcid":false,"given":"Imran Fareed","family":"Nizami","sequence":"additional","affiliation":[{"name":"Department of Electrical Engineering, Bahria University, Islamabad, Pakistan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2488-8353","authenticated-orcid":false,"given":"Farman","family":"Ullah","sequence":"additional","affiliation":[{"name":"College of Information Technology, United Arab Emirates University, Al Ain, United Arab Emirates"}]},{"given":"Irfan","family":"Hussain","sequence":"additional","affiliation":[{"name":"Khalifa University Center for Autonomous Robotic Systems (KUCARS), Khalifa University, Abu Dhabi, United Arab Emirates"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2008.930649"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2003.819861"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1080\/00401706.1995.10484391"},{"key":"ref4","first-page":"207","article-title":"What\u2019s wrong with mean-squared error?","volume-title":"Digital Images and Human Vision","author":"Girod","year":"1993"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01167"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1989.1.4.541"},{"key":"ref7","first-page":"1","article-title":"Imagenet classification with deep convolutional neural networks","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"25","author":"Krizhevsky"},{"key":"ref8","volume-title":"Deep Learning","author":"Goodfellow","year":"2016"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref10","article-title":"An image is worth 16\u00d716 words: Transformers for image recognition at scale","author":"Dosovitskiy","year":"2020","journal-title":"arXiv:2010.11929"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01270"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00813"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3465055"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00681"},{"key":"ref15","article-title":"Deformable DETR: Deformable transformers for end-to-end object detection","author":"Zhu","year":"2020","journal-title":"arXiv:2010.04159"},{"key":"ref16","first-page":"23296","article-title":"Intriguing properties of vision transformers","volume-title":"Proc. NIPS","volume":"34","author":"Naseer"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.conll-1.48"},{"key":"ref18","first-page":"23885","article-title":"Partial success in closing the gap between human and machine vision","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"34","author":"Geirhos"},{"key":"ref19","article-title":"Are convolutional neural networks or transformers more like human vision?","author":"Tuli","year":"2021","journal-title":"arXiv:2105.07197"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3597434"},{"key":"ref21","article-title":"VTAMIQ: Transformers for attention modulated image quality assessment","author":"Chubarau","year":"2021","journal-title":"arXiv:2110.01655"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2022.10.007"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1117\/12.3006137"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1016\/j.procs.2023.08.080"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/3606692"},{"key":"ref26","first-page":"2","article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","volume-title":"Proc. Naacl-HLT","volume":"1","author":"Devlin"},{"key":"ref27","article-title":"AMMUS: A survey of transformer-based pretrained models in natural language processing","author":"Kalyan","year":"2021","journal-title":"arXiv:2108.05542"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58558-7_29"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-92910-9_11"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1016\/j.jvcir.2011.01.005"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2012.2214048"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2011.2175935"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2011.2109730"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2008.2011760"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2002.1038064"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2005.854492"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2014.2372333"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2016.2537321"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2010.2043888"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2011.2147325"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2012.2191563"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2012.2214050"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2014.2355716"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2014.2373812"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2016.2601028"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.224"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6247789"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2012.2227726"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2015.2426416"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.133"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2017.2760518"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2016.7533065"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.213"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW53098.2021.00044"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2020.3030895"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3045810"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00194"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00068"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2017.2774045"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2904879"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2018.2886771"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01415"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00372"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1364\/JOSAA.448144"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413804"},{"key":"ref67","article-title":"Very deep convolutional networks for large-scale image recognition","author":"Simonyan","year":"2014","journal-title":"arXiv:1409.1556"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00745"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01234-2_18"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00569"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00758"},{"key":"ref73","article-title":"MS-UNIQUE: Multi-model and sharpness-weighted unsupervised image quality estimation","author":"Prabhushankar","year":"2018","journal-title":"arXiv:1811.08947"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00513"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/WACVW54805.2022.00015"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW53098.2021.00054"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2022.3209810"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.3390\/math11071599"},{"key":"ref79","article-title":"Learning transformer features for image quality assessment","author":"Zeng","year":"2021","journal-title":"arXiv:2112.00485"},{"key":"ref80","article-title":"Multi-scale features and parallel transformers based image quality assessment","author":"Keshari","year":"2022","journal-title":"arXiv:2204.09779"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v31i1.11231"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1016\/j.jvcir.2023.103850"},{"key":"ref83","article-title":"Blind image quality assessment via transformer predicted error map and perceptual quality token","author":"Shi","year":"2023","journal-title":"arXiv:2305.09353"},{"key":"ref84","article-title":"Local distortion aware efficient transformer adaptation for image quality assessment","author":"Xu","year":"2023","journal-title":"arXiv:2308.12001"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2022.119268"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW54120.2021.00222"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i2.25302"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1007\/s10489-023-05104-3"},{"key":"ref89","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP42928.2021.9506075"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2022.3224319"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2021.3112197"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2023.126437"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10096042"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.3390\/electronics11142132"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.1109\/WACV51458.2022.00404"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP49359.2023.10222634"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00510"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1007\/s00521-023-09188-3"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00133"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00126"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00123"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.5555\/3045118.3045167"},{"key":"ref103","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2006.881959"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.1117\/1.3267105"},{"key":"ref105","first-page":"106","article-title":"Color image database TID2013: Peculiarities and preliminary results","volume-title":"Proc. Eur. Workshop Vis. Inf. Process. (EUVIP)","author":"Ponomarenko"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.1109\/QoMEX.2019.8743252"},{"key":"ref107","article-title":"PIPAL: A large-scale image quality assessment dataset for perceptual image restoration","author":"Gu","year":"2020","journal-title":"arXiv:2007.12142"},{"key":"ref108","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00109"},{"key":"ref109","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2016.07.033"},{"key":"ref110","doi-asserted-by":"publisher","DOI":"10.1145\/2812802"},{"key":"ref111","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2020.2967829"},{"key":"ref112","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00373"},{"key":"ref113","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2015.2500021"},{"key":"ref114","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2014.2378061"},{"key":"ref115","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2010.2053549"},{"key":"ref116","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00363"},{"key":"ref117","article-title":"Final report from the Video Quality Experts Group on the validation of objective models of video quality assessment","author":"Antkowiak","year":"2000"},{"key":"ref118","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2102.10882"},{"key":"ref119","doi-asserted-by":"publisher","DOI":"10.1162\/coli_a_00445"},{"key":"ref120","article-title":"A survey of domain adaptation for neural machine translation","author":"Chu","year":"2018","journal-title":"arXiv:1806.00258"},{"key":"ref121","first-page":"1","article-title":"Transformer-xl: Language modeling with longer-term dependency","volume-title":"Proc. ICLR","author":"Dai"},{"key":"ref122","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1146"}],"container-title":["IEEE Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/6287639\/10380310\/10767243.pdf?arnumber=10767243","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,12]],"date-time":"2024-12-12T07:44:42Z","timestamp":1733989482000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10767243\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"references-count":122,"URL":"https:\/\/doi.org\/10.1109\/access.2024.3506273","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024]]}}}