{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T21:35:05Z","timestamp":1757453705585,"version":"3.41.0"},"publisher-location":"Cham","reference-count":62,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031918551","type":"print"},{"value":"9783031918568","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-91856-8_13","type":"book-chapter","created":{"date-parts":[[2025,5,23]],"date-time":"2025-05-23T11:16:41Z","timestamp":1747999001000},"page":"212-228","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["AIM 2024 Challenge on\u00a0Compressed Video Quality Assessment: Methods and\u00a0Results"],"prefix":"10.1007","author":[{"given":"Maksim","family":"Smirnov","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Aleksandr","family":"Gushchin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Anastasia","family":"Antsiferova","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dmitry","family":"Vatolin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Radu","family":"Timofte","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ziheng","family":"Jia","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zicheng","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wei","family":"Sun","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jiaying","family":"Qian","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yuqin","family":"Cao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yinan","family":"Sun","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yuxin","family":"Zhu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiongkuo","family":"Min","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Guangtao","family":"Zhai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kanjar","family":"De","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qing","family":"Luo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ao-Xiang","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Peng","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Haibo","family":"Lei","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Linyan","family":"Jiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yaqing","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wenhui","family":"Meng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiaoheng","family":"Tan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Haiqiang","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiaozhong","family":"Xu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shan","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhenzhong","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhengxue","family":"Cheng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jiahao","family":"Xiao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jun","family":"Xu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chenlong","family":"He","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qi","family":"Zheng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ruoxi","family":"Zhu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Min","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yibo","family":"Fan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhengzhong","family":"Tu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,5,12]]},"reference":[{"key":"13_CR1","unstructured":"Recommended encoding settings for IBM Watson media. https:\/\/support.video.ibm.com\/hc\/en-us\/articles\/207852117-Internet-connection-and-recommended-encoding-settings. Accessed 12 Aug 2022"},{"key":"13_CR2","unstructured":"Recommended encoding settings for twitch streaming. https:\/\/stream.twitch.tv\/encoding\/. Accessed 12 Aug 2022"},{"key":"13_CR3","unstructured":"Recommended encoding settings for youtube. https:\/\/support.google.com\/youtube\/answer\/2853702. Accessed 12 Aug 2022"},{"key":"13_CR4","doi-asserted-by":"crossref","unstructured":"Akiba, T., Sano, S., Yanase, T., Ohta, T., Koyama, M.: Optuna: a next-generation hyperparameter optimization framework. In: Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining (2019)","DOI":"10.1145\/3292500.3330701"},{"key":"13_CR5","first-page":"13814","volume":"35","author":"A Antsiferova","year":"2022","unstructured":"Antsiferova, A., Lavrushkin, S., Smirnov, M., Gushchin, A., Vatolin, D., Kulikov, D.: Video compression dataset and benchmark of learning-based video-quality metrics. Adv. Neural. Inf. Process. Syst. 35, 13814\u201313825 (2022)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"issue":"11","key":"13_CR6","doi-asserted-by":"publisher","first-page":"5217","DOI":"10.1109\/TIP.2017.2729891","volume":"26","author":"CG Bampis","year":"2017","unstructured":"Bampis, C.G., Li, Z., Moorthy, A.K., Katsavounidis, I., Aaron, A., Bovik, A.C.: Study of temporal effects on subjective video quality of experience. IEEE Trans. Image Process. 26(11), 5217\u20135231 (2017)","journal-title":"IEEE Trans. Image Process."},{"issue":"1","key":"13_CR7","doi-asserted-by":"publisher","first-page":"206","DOI":"10.1109\/TIP.2017.2760518","volume":"27","author":"S Bosse","year":"2018","unstructured":"Bosse, S., Maniry, D., M\u00fcller, K.R., Wiegand, T., Samek, W.: Deep neural networks for no-reference and full-reference image quality assessment. IEEE Trans. Image Process. 27(1), 206\u2013219 (2018). https:\/\/doi.org\/10.1109\/TIP.2017.2760518","journal-title":"IEEE Trans. Image Process."},{"key":"13_CR8","doi-asserted-by":"crossref","unstructured":"Chen, C., et al.: TOPIQ: a top-down approach from semantics to distortions for image quality assessment. arXiv preprint arXiv:2308.03060 (2023)","DOI":"10.1109\/TIP.2024.3378466"},{"key":"13_CR9","unstructured":"Conde, M.V., et\u00a0al.: AIM 2024 challenge on raw burst alignment via optical flow estimation. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"13_CR10","unstructured":"Conde, M.V., Lei, Z., Li, W., Katsavounidis, I., Timofte, R., et\u00a0al.: AIM 2024 challenge on efficient video super-resolution for AV1 compressed content. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"13_CR11","unstructured":"Conde, M.V., et\u00a0al.: Compressed depth map super-resolution and restoration: AIM 2024 challenge results. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"13_CR12","doi-asserted-by":"publisher","unstructured":"Corey, D., Dunlap, W., Burke, M.: Averaging correlations: expected values and bias in combined Pearson RS and Fisher\u2019s Z transformations. J. Gen. Psychol. 125, 245\u2013261 (1998). https:\/\/doi.org\/10.1080\/00221309809595548","DOI":"10.1080\/00221309809595548"},{"issue":"2","key":"13_CR13","doi-asserted-by":"publisher","first-page":"105","DOI":"10.5566\/ias.1534","volume":"37","author":"K De","year":"2018","unstructured":"De, K., Masilamani, V.: No-reference image quality measure for images with multiple distortions using random forests for multi method fusion. Image Anal. Stereol. 37(2), 105\u2013117 (2018)","journal-title":"Image Anal. Stereol."},{"key":"13_CR14","doi-asserted-by":"crossref","unstructured":"De\u00a0Simone, F., Tagliasacchi, M., Naccari, M., Tubaro, S., Ebrahimi, T.: A H. 264\/AVC video database for the evaluation of quality metrics. In: 2010 IEEE International Conference on Acoustics, Speech and Signal Processing, pp. 2430\u20132433. IEEE (2010)","DOI":"10.1109\/ICASSP.2010.5496296"},{"key":"13_CR15","doi-asserted-by":"publisher","unstructured":"Ding, K., Ma, K., Wang, S., Simoncelli, E.: Image quality assessment: unifying structure and texture similarity. IEEE Trans. Pattern Anal. Mach. Intell. PP, 1 (2020). https:\/\/doi.org\/10.1109\/TPAMI.2020.3045810","DOI":"10.1109\/TPAMI.2020.3045810"},{"key":"13_CR16","doi-asserted-by":"crossref","unstructured":"Feichtenhofer, C., Fan, H., Malik, J., He, K.: SlowFast networks for video recognition. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6202\u20136211 (2019)","DOI":"10.1109\/ICCV.2019.00630"},{"issue":"9","key":"13_CR17","doi-asserted-by":"publisher","first-page":"2061","DOI":"10.1109\/TCSVT.2017.2707479","volume":"28","author":"D Ghadiyaram","year":"2017","unstructured":"Ghadiyaram, D., Pan, J., Bovik, A.C., Moorthy, A.K., Panda, P., Yang, K.C.: In-capture mobile video distortions: a study of subjective behavior and objective algorithms. IEEE Trans. Circuits Syst. Video Technol. 28(9), 2061\u20132077 (2017)","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"key":"13_CR18","unstructured":"Gushchin, A., Smirnov, M., Antsiferova, A., Lyapustin, E., Vatolin, D.: MSU CVQAD: compressed video quality assessment dataset (2022). https:\/\/videoprocessing.ai\/datasets\/cvqad.html"},{"key":"13_CR19","doi-asserted-by":"crossref","unstructured":"He, C., Zheng, Q., Zhu, R., Zeng, X., Fan, Y., Tu, Z.: Cover: a comprehensive video quality evaluator. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5799\u20135809 (2024)","DOI":"10.1109\/CVPRW63382.2024.00589"},{"key":"13_CR20","unstructured":"Hosu, V., et\u00a0al.: AIM 2024 challenge on UHD blind photo quality assessment. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"13_CR21","doi-asserted-by":"crossref","unstructured":"Hosu, V., et al.: The Konstanz natural video database (koNViD-1K). In: 2017 Ninth International Conference on Quality of Multimedia Experience (QoMEX), pp.\u00a01\u20136. IEEE (2017)","DOI":"10.1109\/QoMEX.2017.7965673"},{"key":"13_CR22","doi-asserted-by":"publisher","first-page":"4041","DOI":"10.1109\/TIP.2020.2967829","volume":"29","author":"V Hosu","year":"2020","unstructured":"Hosu, V., Lin, H., Sziranyi, T., Saupe, D.: KonIQ-10k: an ecologically valid database for deep learning of blind image quality assessment. IEEE Trans. Image Process. 29, 4041\u20134056 (2020). https:\/\/doi.org\/10.1109\/TIP.2020.2967829","journal-title":"IEEE Trans. Image Process."},{"key":"13_CR23","unstructured":"Kastryulin, S., Zakirov, D., Prokopenko, D.: PyTorch Image Quality: Metrics and measure for image quality assessment (2019). https:\/\/github.com\/photosynthesis-team\/piq, open-source software available at https:\/\/github.com\/photosynthesis-team\/piq"},{"key":"13_CR24","doi-asserted-by":"publisher","unstructured":"Kastryulin, S., Zakirov, J., Prokopenko, D., Dylov, D.V.: PyTorch image quality: metrics for image quality assessment (2022). https:\/\/doi.org\/10.48550\/ARXIV.2208.14818. https:\/\/arxiv.org\/abs\/2208.14818","DOI":"10.48550\/ARXIV.2208.14818"},{"key":"13_CR25","doi-asserted-by":"crossref","unstructured":"Keimel, C., Redl, A., Diepold, K.: The tum high definition video datasets. In: 2012 Fourth International Workshop on Quality of Multimedia Experience, pp. 97\u2013102. IEEE (2012)","DOI":"10.1109\/QoMEX.2012.6263865"},{"key":"13_CR26","doi-asserted-by":"crossref","unstructured":"Lao, S., et al.: Attentions help CNNs see better: attention-based hybrid image quality assessment network. arXiv preprint arXiv:2204.10485 (2022)","DOI":"10.1109\/CVPRW56347.2022.00123"},{"key":"13_CR27","doi-asserted-by":"crossref","unstructured":"Li, D., Jiang, T., Jiang, M.: Quality assessment of in-the-wild videos. In: Proceedings of the 27th ACM International Conference on Multimedia, pp. 2351\u20132359 (2019)","DOI":"10.1145\/3343031.3351028"},{"key":"13_CR28","doi-asserted-by":"crossref","unstructured":"Li, D., Jiang, T., Jiang, M.: Norm-in-norm loss with faster convergence and better performance for image quality assessment. In: Proceedings of the 28th ACM International Conference on Multimedia, pp. 789\u2013797 (2020)","DOI":"10.1145\/3394171.3413804"},{"key":"13_CR29","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.jvcir.2015.02.012","volume":"30","author":"JY Lin","year":"2015","unstructured":"Lin, J.Y., Song, R., Wu, C.H., Liu, T., Wang, H., Kuo, C.: MCL-V: a streaming video quality assessment database. J. Vis. Commun. Image Represent. 30, 1\u20139 (2015)","journal-title":"J. Vis. Commun. Image Represent."},{"key":"13_CR30","doi-asserted-by":"crossref","unstructured":"Liu, H., Li, C., Li, Y., Lee, Y.J.: Improved baselines with visual instruction tuning (2023)","DOI":"10.1109\/CVPR52733.2024.02484"},{"key":"13_CR31","unstructured":"Liu, H., et al.: LLaVA-next: Improved reasoning, OCR, and world knowledge (2024). https:\/\/llava-vl.github.io\/blog\/2024-01-30-llava-next\/"},{"key":"13_CR32","unstructured":"Liu, H., Li, C., Wu, Q., Lee, Y.J.: Visual instruction tuning (2023)"},{"key":"13_CR33","doi-asserted-by":"publisher","unstructured":"Liu, X., Van De\u00a0Weijer, J., Bagdanov, A.D.: RankIQA: learning from rankings for no-reference image quality assessment. In: 2017 IEEE International Conference on Computer Vision (ICCV), pp. 1040\u20131049 (2017). https:\/\/doi.org\/10.1109\/ICCV.2017.118","DOI":"10.1109\/ICCV.2017.118"},{"key":"13_CR34","doi-asserted-by":"crossref","unstructured":"Liu, Z., et al.: Swin transformer: hierarchical vision transformer using shifted windows. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 10012\u201310022 (2021)","DOI":"10.1109\/ICCV48922.2021.00986"},{"issue":"2","key":"13_CR35","doi-asserted-by":"publisher","first-page":"129","DOI":"10.1109\/TIT.1982.1056489","volume":"28","author":"S Lloyd","year":"1982","unstructured":"Lloyd, S.: Least squares quantization in PCM. IEEE Trans. Inf. Theory 28(2), 129\u2013137 (1982)","journal-title":"IEEE Trans. Inf. Theory"},{"key":"13_CR36","doi-asserted-by":"publisher","first-page":"6054","DOI":"10.1109\/TIP.2020.2988148","volume":"29","author":"X Min","year":"2020","unstructured":"Min, X., Zhai, G., Zhou, J., Farias, M.C., Bovik, A.C.: Study of subjective and objective quality assessment of audio-visual signals. IEEE Trans. Image Process. 29, 6054\u20136068 (2020)","journal-title":"IEEE Trans. Image Process."},{"issue":"12","key":"13_CR37","doi-asserted-by":"publisher","first-page":"4695","DOI":"10.1109\/TIP.2012.2214050","volume":"21","author":"A Mittal","year":"2012","unstructured":"Mittal, A., Moorthy, A.K., Bovik, A.C.: No-reference image quality assessment in the spatial domain. IEEE Trans. Image Process. 21(12), 4695\u20134708 (2012). https:\/\/doi.org\/10.1109\/TIP.2012.2214050","journal-title":"IEEE Trans. Image Process."},{"key":"13_CR38","unstructured":"Molodetskikh, I., Borisov, A., Vatolin, D.S., Timofte, R., et\u00a0al.: AIM 2024 challenge on video super-resolution quality assessment: Methods and results. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"13_CR39","unstructured":"Moskalenko, A., Bryntsev, A., Vatolin, D.S., Timofte, R., et\u00a0al.: AIM 2024 challenge on video saliency prediction: Methods and results. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"13_CR40","unstructured":"Nazarczuk, M., et\u00a0al.: AIM 2024 sparse neural rendering challenge: methods and results. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"13_CR41","unstructured":"Nazarczuk, M., Tanay, T., Catley-Chandar, S., Shaw, R., Timofte, R., P\u00e9rez-Pellitero, E.: AIM 2024 sparse neural rendering challenge: dataset and benchmark. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"issue":"7","key":"13_CR42","doi-asserted-by":"publisher","first-page":"3073","DOI":"10.1109\/TIP.2016.2562513","volume":"25","author":"M Nuutinen","year":"2016","unstructured":"Nuutinen, M., Virtanen, T., Vaahteranoksa, M., Vuori, T., Oittinen, P., H\u00e4kkinen, J.: CVD 2014-a database for evaluating no-reference video quality assessment algorithms. IEEE Trans. Image Process. 25(7), 3073\u20133086 (2016)","journal-title":"IEEE Trans. Image Process."},{"key":"13_CR43","doi-asserted-by":"crossref","unstructured":"Paudyal, P., Battisti, F., Carli, M.: A study on the effects of quality of service parameters on perceived video quality. In: 2014 5th European Workshop on Visual Information Processing (EUVIP), pp.\u00a01\u20136. IEEE (2014)","DOI":"10.1109\/EUVIP.2014.7018383"},{"key":"13_CR44","doi-asserted-by":"publisher","unstructured":"Reisenhofer, R., Bosse, S., Kutyniok, G., Wiegand, T.: A Haar wavelet-based perceptual similarity index for image quality assessment. Signal Process. Image Commun. 61, 33\u201343 (2018). https:\/\/doi.org\/10.1016\/j.image.2017.11.001","DOI":"10.1016\/j.image.2017.11.001"},{"issue":"2","key":"13_CR45","doi-asserted-by":"publisher","first-page":"612","DOI":"10.1109\/TIP.2018.2869673","volume":"28","author":"Z Sinno","year":"2018","unstructured":"Sinno, Z., Bovik, A.C.: Large-scale study of perceptual video quality. IEEE Trans. Image Process. 28(2), 612\u2013627 (2018)","journal-title":"IEEE Trans. Image Process."},{"key":"13_CR46","doi-asserted-by":"crossref","unstructured":"Stroud, J., Ross, D., Sun, C., Deng, J., Sukthankar, R.: D3D: distilled 3D networks for video action recognition. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 625\u2013634 (2020)","DOI":"10.1109\/WACV45572.2020.9093274"},{"key":"13_CR47","doi-asserted-by":"crossref","unstructured":"Wang, H., et al.: MCL-JCV: A JND-based H. 264\/AVC video quality assessment dataset. In: 2016 IEEE International Conference on Image Processing (ICIP), pp. 1509\u20131513. IEEE (2016)","DOI":"10.1109\/ICIP.2016.7532610"},{"key":"13_CR48","doi-asserted-by":"publisher","first-page":"292","DOI":"10.1016\/j.jvcir.2017.04.009","volume":"46","author":"H Wang","year":"2017","unstructured":"Wang, H., et al.: VideoSet: a large-scale compressed video quality dataset based on JND measurement. J. Vis. Commun. Image Represent. 46, 292\u2013302 (2017)","journal-title":"J. Vis. Commun. Image Represent."},{"key":"13_CR49","doi-asserted-by":"crossref","unstructured":"Wang, J., Chan, K.C., Loy, C.C.: Exploring clip for assessing the look and feel of images. In: AAAI (2023)","DOI":"10.1609\/aaai.v37i2.25353"},{"key":"13_CR50","doi-asserted-by":"crossref","unstructured":"Wang, Y., Inguva, S., Adsumilli, B.: Youtube UGC dataset for video compression research. In: 2019 IEEE 21st International Workshop on Multimedia Signal Processing (MMSP), pp.\u00a01\u20135. IEEE (2019)","DOI":"10.1109\/MMSP.2019.8901772"},{"key":"13_CR51","doi-asserted-by":"crossref","unstructured":"Wang, Y., et al.: Rich features for perceptual quality assessment of UGC videos. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13435\u201313444 (2021)","DOI":"10.1109\/CVPR46437.2021.01323"},{"key":"13_CR52","unstructured":"Wang, Z., Simoncelli, E.P., Bovik, A.C.: Multiscale structural similarity for image quality assessment. In: The Thrity-Seventh Asilomar Conference on Signals, Systems & Computers, vol.\u00a02, pp. 1398\u20131402. IEEE (2003)"},{"key":"13_CR53","doi-asserted-by":"crossref","unstructured":"Wu, H., et al.: Fast-VQA: efficient end-to-end video quality assessment with fragment sampling. In: European Conference on Computer Vision, pp. 538\u2013554. Springer (2022)","DOI":"10.1007\/978-3-031-20068-7_31"},{"key":"13_CR54","doi-asserted-by":"crossref","unstructured":"Wu, H., et al.: Q-instruct: improving low-level visual abilities for multi-modality foundation models (2023)","DOI":"10.1109\/CVPR52733.2024.02408"},{"key":"13_CR55","unstructured":"Wu, H., et al.: Q-align: teaching LMMs for visual scoring via discrete text-defined levels. arXiv preprint arXiv:2312.17090 (2023)"},{"key":"13_CR56","doi-asserted-by":"crossref","unstructured":"Ying, Z., Mandal, M., Ghadiyaram, D., Bovik, A.: Patch-VQ: \u2018patching up\u2019 the video quality problem. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 14019\u201314029 (2021)","DOI":"10.1109\/CVPR46437.2021.01380"},{"key":"13_CR57","doi-asserted-by":"crossref","unstructured":"Ying, Z., Niu, H., Gupta, P., Mahajan, D., Ghadiyaram, D., Bovik, A.: From patches to pictures (PaQ-2-PiQ): mapping the perceptual space of picture quality. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3575\u20133585 (2020)","DOI":"10.1109\/CVPR42600.2020.00363"},{"issue":"8","key":"13_CR58","doi-asserted-by":"publisher","first-page":"4749","DOI":"10.1109\/TCYB.2023.3338615","volume":"54","author":"AX Zhang","year":"2024","unstructured":"Zhang, A.X., Wang, Y.G., Tang, W., Li, L., Kwong, S.: A spatial-temporal video quality assessment method via comprehensive HVS simulation. IEEE Trans. Cybernet. 54(8), 4749\u20134762 (2024). https:\/\/doi.org\/10.1109\/TCYB.2023.3338615","journal-title":"IEEE Trans. Cybernet."},{"key":"13_CR59","doi-asserted-by":"publisher","unstructured":"Zhang, R., Isola, P., Efros, A.A., Shechtman, E., Wang, O.: The unreasonable effectiveness of deep features as a perceptual metric. In: 2018 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 586\u2013595 (2018). https:\/\/doi.org\/10.1109\/CVPR.2018.00068","DOI":"10.1109\/CVPR.2018.00068"},{"issue":"1","key":"13_CR60","doi-asserted-by":"publisher","first-page":"36","DOI":"10.1109\/TCSVT.2018.2886771","volume":"30","author":"W Zhang","year":"2020","unstructured":"Zhang, W., Ma, K., Yan, J., Deng, D., Wang, Z.: Blind image quality assessment using a deep bilinear convolutional neural network. IEEE Trans. Circuits Syst. Video Technol. 30(1), 36\u201347 (2020)","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"key":"13_CR61","doi-asserted-by":"crossref","unstructured":"Zhang, W., Zhai, G., Wei, Y., Yang, X., Ma, K.: Blind image quality assessment via vision-language correspondence: a multitask learning perspective. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 14071\u201314081 (2023)","DOI":"10.1109\/CVPR52729.2023.01352"},{"key":"13_CR62","doi-asserted-by":"crossref","unstructured":"Zhu, H., Li, L., Wu, J., Dong, W., Shi, G.: MetaIQA: deep meta-learning for no-reference image quality assessment. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 14143\u201314152 (2020)","DOI":"10.1109\/CVPR42600.2020.01415"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024 Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-91856-8_13","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,23]],"date-time":"2025-05-23T11:16:58Z","timestamp":1747999018000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-91856-8_13"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031918551","9783031918568"],"references-count":62,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-91856-8_13","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"12 May 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}