{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,20]],"date-time":"2026-05-20T16:44:23Z","timestamp":1779295463633,"version":"3.51.4"},"publisher-location":"Cham","reference-count":56,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031918551","type":"print"},{"value":"9783031918568","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-91856-8_11","type":"book-chapter","created":{"date-parts":[[2025,5,23]],"date-time":"2025-05-23T11:02:05Z","timestamp":1747998125000},"page":"178-194","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["AIM 2024 Challenge on\u00a0Video Saliency Prediction: Methods and\u00a0Results"],"prefix":"10.1007","author":[{"given":"Andrey","family":"Moskalenko","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alexey","family":"Bryncev","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dmitry","family":"Vatolin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Radu","family":"Timofte","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Gen","family":"Zhan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Li","family":"Yang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yunlong","family":"Tang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yiting","family":"Liao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jiongzhi","family":"Lin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Baitao","family":"Huang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Morteza","family":"Moradi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mohammad","family":"Moradi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Francesco","family":"Rundo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Concetto","family":"Spampinato","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ali","family":"Borji","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Simone","family":"Palazzo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yuxin","family":"Zhu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yinan","family":"Sun","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Huiyu","family":"Duan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yuqin","family":"Cao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ziheng","family":"Jia","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qiang","family":"Hu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiongkuo","family":"Min","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Guangtao","family":"Zhai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hao","family":"Fang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Runmin","family":"Cong","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiankai","family":"Lu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiaofei","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wei","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chunyu","family":"Zhao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Wentao","family":"Mu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tao","family":"Deng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hamed R.","family":"Tavakoli","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,5,12]]},"reference":[{"issue":"8","key":"11_CR1","doi-asserted-by":"publisher","first-page":"11917","DOI":"10.1007\/s11042-020-10185-0","volume":"80","author":"M Ahmadi","year":"2021","unstructured":"Ahmadi, M., Karimi, N., Samavi, S.: Context-aware saliency detection for image retargeting using convolutional neural networks. Multimed. Tools Appl. 80(8), 11917\u201311941 (2021). https:\/\/doi.org\/10.1007\/s11042-020-10185-0","journal-title":"Multimed. Tools Appl."},{"issue":"7","key":"11_CR2","doi-asserted-by":"publisher","first-page":"1688","DOI":"10.1109\/TMM.2017.2777665","volume":"20","author":"C Bak","year":"2017","unstructured":"Bak, C., Kocak, A., Erdem, E., Erdem, A.: Spatio-temporal saliency networks for dynamic saliency prediction. IEEE Trans. Multimedia 20(7), 1688\u20131698 (2017)","journal-title":"IEEE Trans. Multimedia"},{"issue":"3","key":"11_CR3","doi-asserted-by":"publisher","first-page":"740","DOI":"10.1109\/TPAMI.2018.2815601","volume":"41","author":"Z Bylinskii","year":"2018","unstructured":"Bylinskii, Z., Judd, T., Oliva, A., Torralba, A., Durand, F.: What do different evaluation metrics tell us about saliency models? IEEE Trans. Pattern Anal. Mach. Intell. 41(3), 740\u2013757 (2018)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"11_CR4","unstructured":"Conde, M.V., et\u00a0al.: AIM 2024 challenge on raw burst alignment via optical flow estimation. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"11_CR5","unstructured":"Conde, M.V., et\u00a0al.: AIM 2024 challenge on efficient video super-resolution for AV1 compressed content. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"11_CR6","unstructured":"Conde, M.V., et\u00a0al.: Compressed depth map super-resolution and restoration: AIM 2024 challenge results. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"11_CR7","doi-asserted-by":"crossref","unstructured":"Cornia, M., Baraldi, L., Serra, G., Cucchiara, R.: Predicting human eye fixations via an LSTM-based saliency attentive model. IEEE Trans. Image Process. 27(10), 5142\u20135154 (2018)","DOI":"10.1109\/TIP.2018.2851672"},{"key":"11_CR8","unstructured":"Dao, T., Gu, A.: Transformers are SSMS: generalized models and efficient algorithms through structured state space duality. arXiv preprint arXiv:2405.21060 (2024)"},{"issue":"9","key":"11_CR9","doi-asserted-by":"publisher","first-page":"3888","DOI":"10.1109\/TIP.2012.2199126","volume":"21","author":"Y Fang","year":"2012","unstructured":"Fang, Y., Chen, Z., Lin, W., Lin, C.W.: Saliency detection in the compressed domain for adaptive image retargeting. IEEE Trans. Image Process. 21(9), 3888\u20133901 (2012)","journal-title":"IEEE Trans. Image Process."},{"key":"11_CR10","doi-asserted-by":"crossref","unstructured":"Gitman, Y., Erofeev, M., Vatolin, D., Bolshakov, A., Fedorov, A.: Semiautomatic Visual-Attention modeling and its application to video compression. In: 2014 IEEE International Conference on Image Processing (ICIP) (ICIP 2014), Paris, France, pp. 1105\u20131109 (2014)","DOI":"10.1109\/ICIP.2014.7025220"},{"key":"11_CR11","unstructured":"Gu, A., Dao, T.: Mamba: linear-time sequence modeling with selective state spaces. arXiv preprint arXiv:2312.00752 (2023)"},{"key":"11_CR12","doi-asserted-by":"crossref","unstructured":"Gu, K., et al.: Saliency-guided quality assessment of screen content images. IEEE Trans. Multimedia 18(6), 1098\u20131110 (2016)","DOI":"10.1109\/TMM.2016.2547343"},{"key":"11_CR13","unstructured":"Guo, C., Ma, Q., Zhang, L.: Spatio-temporal saliency detection using phase spectrum of quaternion Fourier transform. In: 2008 IEEE Conference on Computer Vision and Pattern Recognition, pp.\u00a01\u20138. IEEE (2008)"},{"issue":"1","key":"11_CR14","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1109\/TIP.2013.2282897","volume":"23","author":"H Hadizadeh","year":"2013","unstructured":"Hadizadeh, H., Baji\u0107, I.V.: Saliency-aware video compression. IEEE Trans. Image Process. 23(1), 19\u201333 (2013)","journal-title":"IEEE Trans. Image Process."},{"key":"11_CR15","doi-asserted-by":"crossref","unstructured":"Harel, J., Koch, C., Perona, P.: Graph-based visual saliency. Adv. Neural Inf. Process. Syst. 19 (2006)","DOI":"10.7551\/mitpress\/7503.003.0073"},{"key":"11_CR16","unstructured":"Hosu, V., et\u00a0al.: AIM 2024 challenge on UHD blind photo quality assessment. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"11_CR17","doi-asserted-by":"crossref","unstructured":"Hu, J., Shen, L., Sun, G.: Squeeze-and-excitation networks. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7132\u20137141 (2018)","DOI":"10.1109\/CVPR.2018.00745"},{"issue":"11","key":"11_CR18","doi-asserted-by":"publisher","first-page":"1254","DOI":"10.1109\/34.730558","volume":"20","author":"L Itti","year":"1998","unstructured":"Itti, L., Koch, C., Niebur, E.: A model of saliency-based visual attention for rapid scene analysis. IEEE Trans. Pattern Anal. Mach. Intell. 20(11), 1254\u20131259 (1998)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"11_CR19","doi-asserted-by":"crossref","unstructured":"Jain, S., Yarlagadda, P., Jyoti, S., Karthik, S., Subramanian, R., Gandhi, V.: ViNet: pushing the limits of visual modality for audio-visual saliency prediction. In: 2021 IEEE\/RSJ International Conference on Intelligent Robots and Systems (IROS), pp. 3520\u20133527. IEEE (2021)","DOI":"10.1109\/IROS51168.2021.9635989"},{"key":"11_CR20","doi-asserted-by":"crossref","unstructured":"Jiang, L., Xu, M., Liu, T., Qiao, M., Wang, Z.: DeepVS: a deep learning based video saliency prediction approach. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 602\u2013617 (2018)","DOI":"10.1007\/978-3-030-01264-9_37"},{"key":"11_CR21","doi-asserted-by":"crossref","unstructured":"Jiang, M., Huang, S., Duan, J., Zhao, Q.: SALICON: saliency in context. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1072\u20131080 (2015)","DOI":"10.1109\/CVPR.2015.7298710"},{"key":"11_CR22","doi-asserted-by":"crossref","unstructured":"Judd, T., Ehinger, K., Durand, F., Torralba, A.: Learning to predict where humans look. In: 2009 IEEE 12th International Conference on Computer Vision, pp. 2106\u20132113. IEEE (2009)","DOI":"10.1109\/ICCV.2009.5459462"},{"key":"11_CR23","doi-asserted-by":"crossref","unstructured":"Kim, N.W., et al.: BubbleView: an interface for crowdsourcing image importance maps and tracking visual attention. ACM Trans. Comput.-Hum. Interact. (TOCHI) 24(5), 1\u201340 (2017)","DOI":"10.1145\/3131275"},{"key":"11_CR24","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1016\/j.neunet.2020.05.004","volume":"129","author":"A Kroner","year":"2020","unstructured":"Kroner, A., Senden, M., Driessens, K., Goebel, R.: Contextual encoder-decoder network for visual saliency prediction. Neural Netw. 129, 261\u2013270 (2020)","journal-title":"Neural Netw."},{"key":"11_CR25","doi-asserted-by":"crossref","unstructured":"Li, J., Wen, Y., He, L.: SCConv: spatial and channel reconstruction convolution for feature redundancy. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6153\u20136162 (2023)","DOI":"10.1109\/CVPR52729.2023.00596"},{"key":"11_CR26","doi-asserted-by":"crossref","unstructured":"Li, K., et al.: Unmasked teacher: towards training-efficient video foundation models. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 19948\u201319960 (2023)","DOI":"10.1109\/ICCV51070.2023.01826"},{"key":"11_CR27","doi-asserted-by":"crossref","unstructured":"Liu, Z., et al.: Video swin transformer. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3202\u20133211 (2022)","DOI":"10.1109\/CVPR52688.2022.00320"},{"key":"11_CR28","doi-asserted-by":"crossref","unstructured":"Lyudvichenko, V., Erofeev, M., Gitman, Y., Vatolin, D.: A semiautomatic saliency model and its application to video compression. In: 2017 13th IEEE International Conference on Intelligent Computer Communication and Processing (ICCP), pp. 403\u2013410. IEEE (2017)","DOI":"10.1109\/ICCP.2017.8117038"},{"key":"11_CR29","doi-asserted-by":"crossref","unstructured":"Lyudvichenko, V., Vatolin, D.: Predicting video saliency using crowdsourced mouse-tracking data. In: Proceedings of the GraphiCon, pp. 127\u2013130 (2019)","DOI":"10.30987\/graphicon-2019-2-127-130"},{"issue":"1","key":"11_CR30","doi-asserted-by":"publisher","first-page":"171","DOI":"10.1109\/TPAMI.2009.112","volume":"32","author":"V Mahadevan","year":"2009","unstructured":"Mahadevan, V., Vasconcelos, N.: Spatiotemporal saliency in dynamic scenes. IEEE Trans. Pattern Anal. Mach. Intell. 32(1), 171\u2013177 (2009)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"3","key":"11_CR31","doi-asserted-by":"publisher","first-page":"231","DOI":"10.1007\/s11263-009-0215-3","volume":"82","author":"S Marat","year":"2009","unstructured":"Marat, S., Ho Phuoc, T., Granjon, L., Guyader, N., Pellerin, D., Gu\u00e9rin-Dugu\u00e9, A.: Modelling spatio-temporal saliency to predict gaze direction for short videos. Int. J. Comput. Vision 82(3), 231\u2013243 (2009)","journal-title":"Int. J. Comput. Vision"},{"key":"11_CR32","doi-asserted-by":"crossref","unstructured":"Mathe, S., Sminchisescu, C.: Actions in the eye: dynamic gaze datasets and learnt saliency models for visual recognition. IEEE Trans. Pattern Anal. Mach. Intell. 37(7), 1408\u20131424 (2014)","DOI":"10.1109\/TPAMI.2014.2366154"},{"key":"11_CR33","doi-asserted-by":"crossref","unstructured":"Miangoleh, S.M.H., Bylinskii, Z., Kee, E., Shechtman, E., Aksoy, Y.: Realistic saliency guided image enhancement. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 186\u2013194 (2023)","DOI":"10.1109\/CVPR52729.2023.00026"},{"key":"11_CR34","doi-asserted-by":"crossref","unstructured":"Min, K., Corso, J.J.: TASED-Net: temporally-aggregating spatial encoder-decoder network for video saliency detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 2394\u20132403 (2019)","DOI":"10.1109\/ICCV.2019.00248"},{"key":"11_CR35","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1007\/s12559-010-9074-z","volume":"3","author":"PK Mital","year":"2011","unstructured":"Mital, P.K., Smith, T.J., Hill, R.L., Henderson, J.M.: Clustering of gaze during dynamic scene viewing is predicted by motion. Cogn. Comput. 3, 5\u201324 (2011)","journal-title":"Cogn. Comput."},{"key":"11_CR36","unstructured":"Molodetskikh, I., Borisov, A., Vatolin, D.S., Timofte, R., et\u00a0al.: AIM 2024 challenge on video super-resolution quality assessment: Methods and results. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"11_CR37","doi-asserted-by":"crossref","unstructured":"Moradi, M., Moradi, M., Rundo, F., Spampinato, C., Borji, A., Palazzo, S.: SalFoM: dynamic saliency prediction with video foundation models. arXiv preprint arXiv:2404.03097 (2024)","DOI":"10.1007\/978-3-031-78312-8_3"},{"key":"11_CR38","unstructured":"Nazarczuk, M., et\u00a0al.: AIM 2024 sparse neural rendering challenge: methods and results. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"11_CR39","unstructured":"Nazarczuk, M., Tanay, T., Catley-Chandar, S., Shaw, R., Timofte, R., P\u00e9rez-Pellitero, E.: AIM 2024 sparse neural rendering challenge: Dataset and benchmark. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"11_CR40","doi-asserted-by":"crossref","unstructured":"Papoutsaki, A., Laskey, J., Huang, J.: SearchGazer: webcam eye tracking for remote studies of web search. In: Proceedings of the 2017 Conference on Conference Human Information Interaction and Retrieval, pp. 17\u201326 (2017)","DOI":"10.1145\/3020165.3020170"},{"key":"11_CR41","doi-asserted-by":"crossref","unstructured":"Patel, Y., Appalaraju, S., Manmatha, R.: Saliency driven perceptual image compression. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 227\u2013236 (2021)","DOI":"10.1109\/WACV48630.2021.00027"},{"key":"11_CR42","unstructured":"Payne, K.: Online mouse tracking as a measure of attention in videos, using a mouse-contingent bi-resolution display. Thesis, Department of Psychological Sciences (2023). https:\/\/hdl.handle.net\/2097\/43472, master of Science"},{"key":"11_CR43","doi-asserted-by":"crossref","unstructured":"Riche, N., Duvinage, M., Mancas, M., Gosselin, B., Dutoit, T.: Saliency and human fixations: State-of-the-art and study of comparison metrics. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1153\u20131160 (2013)","DOI":"10.1109\/ICCV.2013.147"},{"key":"11_CR44","unstructured":"Rudoy, D., Goldman, D.B., Shechtman, E., Zelnik-Manor, L.: Crowdsourcing gaze data collection. arXiv preprint arXiv:1204.3367 (2012)"},{"key":"11_CR45","unstructured":"Smirnov, M., et\u00a0al.: AIM 2024 challenge on compressed video quality assessment: methods and results. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops (2024)"},{"key":"11_CR46","doi-asserted-by":"crossref","unstructured":"Tavakoli, H.R., Ahmed, F., Borji, A., Laaksonen, J.: Saliency revisited: analysis of mouse movements versus fixations. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1774\u20131782 (2017)","DOI":"10.1109\/CVPR.2017.673"},{"key":"11_CR47","unstructured":"Tavakoli, H.R., Borji, A., Rahtu, E., Kannala, J.: DAVE: a deep audio-visual embedding for dynamic saliency prediction. arXiv preprint arXiv:1905.10693 (2019)"},{"key":"11_CR48","doi-asserted-by":"crossref","unstructured":"Vig, E., Dorr, M., Cox, D.: Large-scale optimization of hierarchical features for saliency prediction in natural images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2798\u20132805 (2014)","DOI":"10.1109\/CVPR.2014.358"},{"key":"11_CR49","doi-asserted-by":"crossref","unstructured":"Wang, W., Shen, J., Guo, F., Cheng, M.M., Borji, A.: Revisiting video saliency: a large-scale benchmark and a new model. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (2018)","DOI":"10.1109\/CVPR.2018.00514"},{"key":"11_CR50","doi-asserted-by":"crossref","unstructured":"Wang, Y., Inguva, S., Adsumilli, B.: Youtube UGC dataset for video compression research. In: 2019 IEEE 21st International Workshop on Multimedia Signal Processing (MMSP), pp.\u00a01\u20135. IEEE (2019)","DOI":"10.1109\/MMSP.2019.8901772"},{"key":"11_CR51","doi-asserted-by":"crossref","unstructured":"Xiong, J., Wang, G., Zhang, P., Huang, W., Zha, Y., Zhai, G.: CASP-Net: rethinking video saliency prediction from an audio-visual consistency perceptual perspective. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6441\u20136450 (2023)","DOI":"10.1109\/CVPR52729.2023.00623"},{"key":"11_CR52","unstructured":"Xu, P., Ehinger, K.A., Zhang, Y., Finkelstein, A., Kulkarni, S.R., Xiao, J.: Turkergaze: crowdsourcing saliency with webcam based eye tracking. arXiv preprint arXiv:1504.06755 (2015)"},{"key":"11_CR53","doi-asserted-by":"crossref","unstructured":"Yang, S., Jiang, Q., Lin, W., Wang, Y.: SGDNet: an end-to-end saliency-guided deep neural network for no-reference image quality assessment. In: Proceedings of the 27th ACM International Conference on Multimedia, pp. 1383\u20131391 (2019)","DOI":"10.1145\/3343031.3350990"},{"key":"11_CR54","doi-asserted-by":"crossref","unstructured":"Zhang, Q.L., Yang, Y.B.: SA-Net: shuffle attention for deep convolutional neural networks. In: ICASSP 2021-2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 2235\u20132239. IEEE (2021)","DOI":"10.1109\/ICASSP39728.2021.9414568"},{"issue":"3","key":"11_CR55","doi-asserted-by":"publisher","first-page":"1275","DOI":"10.1109\/TIP.2017.2651410","volume":"26","author":"W Zhang","year":"2017","unstructured":"Zhang, W., Liu, H.: Study of saliency in objective video quality assessment. IEEE Trans. Image Process. 26(3), 1275\u20131288 (2017)","journal-title":"IEEE Trans. Image Process."},{"issue":"12","key":"11_CR56","doi-asserted-by":"publisher","first-page":"7696","DOI":"10.1109\/TCSVT.2023.3278410","volume":"33","author":"X Zhou","year":"2023","unstructured":"Zhou, X., et al.: Transformer-based multi-scale feature integration network for video saliency prediction. IEEE Trans. Circuits Syst. Video Technol. 33(12), 7696\u20137707 (2023)","journal-title":"IEEE Trans. Circuits Syst. Video Technol."}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024 Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-91856-8_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,23]],"date-time":"2025-05-23T11:02:28Z","timestamp":1747998148000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-91856-8_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031918551","9783031918568"],"references-count":56,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-91856-8_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"12 May 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}