{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,17]],"date-time":"2026-06-17T19:57:15Z","timestamp":1781726235296,"version":"3.54.5"},"reference-count":54,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"2","license":[{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"name":"European Union under the Italian National Recovery and Resilience Plan (NRRP) Mission 4, Component 2, Investment 1.3","award":["CUP C93C22005250001"],"award-info":[{"award-number":["CUP C93C22005250001"]}]},{"name":"\"Telecommunications of the Future\u201d","award":["PE00000001"],"award-info":[{"award-number":["PE00000001"]}]},{"name":"European Union\u2019s Horizon Europe Program","award":["101135637"],"award-info":[{"award-number":["101135637"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. on Broadcast."],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1109\/tbc.2026.3668621","type":"journal-article","created":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T21:00:03Z","timestamp":1772830803000},"page":"533-544","source":"Crossref","is-referenced-by-count":0,"title":["SalFormer360: A Transformer-Based Saliency Estimation Model for 360-Degree Videos"],"prefix":"10.1109","volume":"72","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-4911-3698","authenticated-orcid":false,"given":"Mahmoud Z. A.","family":"Wahba","sequence":"first","affiliation":[{"name":"Department of Information Engineering, University of Padova, Padua, Italy"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9893-5813","authenticated-orcid":false,"given":"Francesco","family":"Barbato","sequence":"additional","affiliation":[{"name":"Department of Information Engineering, University of Padova, Padua, Italy"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5642-3430","authenticated-orcid":false,"given":"Sara","family":"Baldoni","sequence":"additional","affiliation":[{"name":"Department of Information Engineering, University of Padova, Padua, Italy"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0846-5879","authenticated-orcid":false,"given":"Federica","family":"Battisti","sequence":"additional","affiliation":[{"name":"Department of Information Engineering, University of Padova, Padua, Italy"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","volume-title":"Requirements for Mobile Edge Computing-enabled Content Delivery Networks","year":"2019"},{"key":"ref2","doi-asserted-by":"crossref","first-page":"53","DOI":"10.1016\/j.image.2018.03.008","article-title":"A feature-based approach for saliency estimation of omni-directional images","volume":"69","author":"Battisti","year":"2018","journal-title":"Signal Process., Image Commun."},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/WCNC57260.2024.10571028"},{"issue":"8","key":"ref4","doi-asserted-by":"crossref","first-page":"4016","DOI":"10.3390\/s23084016","article-title":"Enhancing 360 video streaming through salient content in head-mounted displays","volume":"23","author":"Nguyen","year":"2023","journal-title":"Sensors"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2021.3070520"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2931807"},{"key":"ref7","first-page":"162","article-title":"Spherical convolution-based saliency detection for FoV prediction in 360-degree video streaming","volume-title":"Proc. Int. Wireless Commun. Mobile Comput. (IWCMC)","author":"Shuai"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICME52920.2022.9859963"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2024.3398548"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/MNET.2025.3548276"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2024.3513221"},{"key":"ref12","article-title":"SegFormer: Simple and efficient design for semantic segmentation with transformers","author":"Xie","year":"2021","journal-title":"arXiv:2105.15203"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2858783"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00559"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01234-2_30"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2022.04.080"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00248"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2021.3139743"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2924417"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6927"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58558-7_25"},{"key":"ref22","article-title":"MobileNets: Efficient convolutional neural networks for mobile vision applications","author":"Howard","year":"2017","journal-title":"arXiv:1704.04861"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ISPA58351.2023.10279300"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3240508.3240669"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP40778.2020.9191331"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1038\/s41598-025-16011-7"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICMEW.2018.8551543"},{"key":"ref28","article-title":"SalGAN: Visual saliency prediction with generative adversarial networks","author":"Pan","year":"2017","journal-title":"arXiv:1701.01081"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/3422622"},{"key":"ref30","article-title":"Panoramic convolutions for 360\u00b0 single-image saliency prediction","volume-title":"Proc. CVPR Workshop Comput. Vis. Augmented Virtual Reality","author":"Martin"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01240-3_32"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2957986"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/MMSP64401.2025.11324125"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00154"},{"key":"ref36","article-title":"Convolutional LSTM network: A machine learning approach for precipitation nowcasting","author":"Shi","year":"2015","journal-title":"arXiv:1506.04214"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3269564"},{"key":"ref38","first-page":"305","article-title":"ATSal: An attention based architecture for saliency prediction in 360 videos","volume-title":"Proc. Int. Conf. Pattern Recognit.","author":"Dahou"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1145\/3511603"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/JETCAS.2024.3377096"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/tmm.2023.3306596"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2019.2955824"},{"key":"ref43","first-page":"200","article-title":"SST-sal: A spherical spatio-temporal approach for saliency prediction in 360\u00b0 videos","volume":"10","author":"Bernal","year":"2022","journal-title":"Jornada de J\u00f3venes Investigadores del"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2024.3407685"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00436"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2021.3126590"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1145\/3565024"},{"key":"ref48","article-title":"Attention is all you need","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"30","author":"Vaswani"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-018-1140-0"},{"key":"ref51","first-page":"8026","article-title":"PyTorch: An imperative style, high-performance deep learning library","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"32","author":"Paszke"},{"key":"ref52","volume-title":"Torchvision: PyTorch\u2019s Computer Vision Library [software]","year":"2016"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2815601"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/QoMEX.2018.8463369"}],"container-title":["IEEE Transactions on Broadcasting"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11\/11563690\/11424030.pdf?arnumber=11424030","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,6,17]],"date-time":"2026-06-17T19:38:02Z","timestamp":1781725082000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11424030\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6]]},"references-count":54,"journal-issue":{"issue":"2"},"URL":"https:\/\/doi.org\/10.1109\/tbc.2026.3668621","relation":{},"ISSN":["0018-9316","1557-9611"],"issn-type":[{"value":"0018-9316","type":"print"},{"value":"1557-9611","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,6]]}}}