{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,10]],"date-time":"2026-03-10T15:27:22Z","timestamp":1773156442393,"version":"3.50.1"},"reference-count":38,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2023,4,13]],"date-time":"2023-04-13T00:00:00Z","timestamp":1681344000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"},{"start":{"date-parts":[[2023,4,13]],"date-time":"2023-04-13T00:00:00Z","timestamp":1681344000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0"}],"funder":[{"name":"Spanish Ministerio de Ciencia y Innovaci\u00f3n","award":["TALENT (PID2020-116417RB-C41)"],"award-info":[{"award-number":["TALENT (PID2020-116417RB-C41)"]}]},{"name":"Spanish Ministerio de Ciencia y Innovaci\u00f3n","award":["TALENT (PID2020-116417RB-C41)"],"award-info":[{"award-number":["TALENT (PID2020-116417RB-C41)"]}]},{"name":"Spanish Ministerio de Ciencia y Innovaci\u00f3n","award":["TALENT (PID2020-116417RB-C41)"],"award-info":[{"award-number":["TALENT (PID2020-116417RB-C41)"]}]},{"name":"Spanish Ministerio de Ciencia y Innovaci\u00f3n","award":["TALENT (PID2020-116417RB-C41)"],"award-info":[{"award-number":["TALENT (PID2020-116417RB-C41)"]}]},{"name":"Portuguese national funds through Funda\u00e7\u00e3o para a Ci\u00eancia e a Tecnologia","award":["UIDB\/50021\/2020"],"award-info":[{"award-number":["UIDB\/50021\/2020"]}]},{"DOI":"10.13039\/501100003759","name":"Universidad Polit\u00e9cnica de Madrid","doi-asserted-by":"crossref","id":[{"id":"10.13039\/501100003759","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Real-Time Image Proc"],"published-print":{"date-parts":[[2023,6]]},"abstract":"<jats:title>Abstract<\/jats:title>\n                  <jats:p>This paper presents a GPU-based parallelisation of an optimised versatile video decoder (VVC) adaptive loop filter (ALF) filter on a resource-constrained heterogeneous platform. The GPU has been comprehensively utilised to maximise the degree of parallelism, making the programme capable of exploiting the GPU capabilities. The proposed approach enables to accelerate the ALF computation by an average of two times when compared to an already fully optimised version of the software decoder implementation over an embedded platform. Finally, this work presents an analysis of energy consumption, showing that the proposed methodology has a negligible impact on this key parameter.<\/jats:p>","DOI":"10.1007\/s11554-023-01300-z","type":"journal-article","created":{"date-parts":[[2023,4,13]],"date-time":"2023-04-13T11:04:11Z","timestamp":1681383851000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["GPU-based parallelisation of a versatile video coding adaptive loop filter in resource-constrained heterogeneous embedded platform"],"prefix":"10.1007","volume":"20","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2268-3642","authenticated-orcid":false,"given":"Anup","family":"Saha","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2491-4977","authenticated-orcid":false,"given":"Nuno","family":"Roma","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0280-3440","authenticated-orcid":false,"given":"Miguel","family":"Chavarr\u00edas","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7445-5823","authenticated-orcid":false,"given":"Tiago","family":"Dias","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3610-4296","authenticated-orcid":false,"given":"Fernando","family":"Pescador","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3885-1068","authenticated-orcid":false,"given":"V\u00edctor","family":"Aranda","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,4,13]]},"reference":[{"key":"1300_CR1","unstructured":"Fraunhofer HHI is proud to present the new state-of-the-art in global video coding: H.266\/VVC brings video transmission to new speed. https:\/\/newsletter.fraunhofer.de\/-viewonline2\/17386\/465\/11\/14SHcBTt\/V44RELLZBp\/1 (2022). Accessed 5 Jun (2022)"},{"key":"1300_CR2","unstructured":"JCT-VC.: High efficient video coding (HEVC), ITU-T Recommendation H.265 and ISO\/IEC 23008-2, ITU-T and ISO\/IEC JTC 1. (2013)"},{"key":"1300_CR3","unstructured":"Feldmann, C.: Versatile video coding hits major milestone. https:\/\/bitmovin.com\/compression-standards-vvc-2020 (2022). Accessed 05 June (2022)"},{"key":"1300_CR4","doi-asserted-by":"publisher","first-page":"3134","DOI":"10.1109\/ICIP40778.2020.9190983","volume":"2020","author":"F Pakdaman","year":"2020","unstructured":"Pakdaman, F., Adelimanesh, M.A., Gabbouj, M., Hashemi, M.R.: Complexity analysis of next-generation VVC encoding and decoding. IEEE Int. Conf. Image Process. (ICIP) 2020, 3134\u20133138 (2020). https:\/\/doi.org\/10.1109\/ICIP40778.2020.9190983","journal-title":"IEEE Int. Conf. Image Process. (ICIP)"},{"key":"1300_CR5","doi-asserted-by":"publisher","first-page":"3320","DOI":"10.3390\/s21103320","volume":"21","author":"A Saha","year":"2021","unstructured":"Saha, A., Chavarr\u00edas, M., Pescador, F., Groba, \u00c1.M., Chassaigne, K., Cebri\u00e1n, P.L.: Complexity analysis of a versatile video coding decoder over embedded systems and general purpose processors. Sensors 21, 3320 (2021). https:\/\/doi.org\/10.3390\/s21103320","journal-title":"Sensors"},{"key":"1300_CR6","unstructured":"Franklin, D.: NVIDIA Jetson AGX Xavier Delivers 32 TeraOps for New Era of AI in Robotics, y. https:\/\/developer.nvidia.com\/blog\/nvidia-jetson-agx-xavier-32-teraops-ai-robotics\/ (2022). Accessed 07 June 2022"},{"key":"1300_CR7","doi-asserted-by":"publisher","first-page":"246","DOI":"10.1109\/BigMM.2016.66","volume":"2016","author":"S Li","year":"2016","unstructured":"Li, S., Wang, R., Yao, K.: CUDA acceleration for AVS2 loop filtering. IEEE Second Int. Conf. Multimed. Big Data (BigMM) 2016, 246\u2013250 (2016). https:\/\/doi.org\/10.1109\/BigMM.2016.66","journal-title":"IEEE Second Int. Conf. Multimed. Big Data (BigMM)"},{"key":"1300_CR8","doi-asserted-by":"publisher","first-page":"3124","DOI":"10.1109\/ICIP40778.2020.9191199","volume":"2020","author":"A Wieckowski","year":"2020","unstructured":"Wieckowski, A., et al.: Towards a live software decoder implementation for the upcoming versatile video coding (VVC) codec. IEEE Int. Conf. Image Process. (ICIP) 2020, 3124\u20133128 (2020). https:\/\/doi.org\/10.1109\/ICIP40778.2020.9191199","journal-title":"IEEE Int. Conf. Image Process. (ICIP)"},{"key":"1300_CR9","doi-asserted-by":"publisher","DOI":"10.1145\/3339825.3391871","author":"S Gudumasu","year":"2020","unstructured":"Gudumasu, S., Bandyopadhyay, S., He, Y.: Software-based versatile video coding decoder parallelization. Proc. ACM Multimed. Syst. Conf. (2020). https:\/\/doi.org\/10.1145\/3339825.3391871","journal-title":"Proc. ACM Multimed. Syst. Conf."},{"key":"1300_CR10","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/ICME51207.2021.9428470","volume":"2021","author":"B Zhu","year":"2021","unstructured":"Zhu, B., et al.: A real-time H.266, VVC software decoder. IEEE Int. Conf. Multimed. Expo (ICME) 2021, 1\u20136 (2021). https:\/\/doi.org\/10.1109\/ICME51207.2021.9428470","journal-title":"IEEE Int. Conf. Multimed. Expo (ICME)"},{"key":"1300_CR11","doi-asserted-by":"publisher","DOI":"10.1109\/PCS50896.2021.9477484","author":"Y Li","year":"2021","unstructured":"Li, Y., et al.: An optimized H266\/VVC software decoder on mobile platform. Pict. Coding Symp. (PCS) (2021). https:\/\/doi.org\/10.1109\/PCS50896.2021.9477484","journal-title":"Pict. Coding Symp. (PCS)"},{"key":"1300_CR12","doi-asserted-by":"publisher","first-page":"1196","DOI":"10.1109\/ICIP40778.2020.9190708","volume":"2020","author":"X Han","year":"2020","unstructured":"Han, X., Wang, S., Ma, S., Gao, W.: Optimization of motion compensation based On GPU and CPU For VVC decoding. IEEE Int. Conf. Image Process. (ICIP) 2020, 1196\u20131200 (2020). https:\/\/doi.org\/10.1109\/ICIP40778.2020.9190708","journal-title":"IEEE Int. Conf. Image Process. (ICIP)"},{"key":"1300_CR13","doi-asserted-by":"crossref","unstructured":"V\u00e1zquez, M.F., Saha, A., Morillas, R.M., Lapastora M.C., Oso, F.P. D.: Work-in-progress: porting new versatile video coding transforms to a heterogeneous GPU-based technology. In: International Conference on Compliers, Architectures and Synthesis for Embedded Systems, pp. 1\u20132 (2019)","DOI":"10.1145\/3349569.3351540"},{"key":"1300_CR14","unstructured":"OpenHEVC software repository. https:\/\/github.com\/OpenHEVC\/openHEVC (2022). Accessed 14 May 2022"},{"issue":"3","key":"1300_CR15","doi-asserted-by":"publisher","first-page":"276","DOI":"10.1109\/TCE.2018.2867812","volume":"64","author":"Y Wang","year":"2018","unstructured":"Wang, Y., Guo, X., Fan, X., Lu, Y., Zhao, D., Gao, W.: Parallel in-loop filtering in HEVC encoder on GPU. IEEE Trans. Consum. Electron. 64(3), 276\u2013284 (2018). https:\/\/doi.org\/10.1109\/TCE.2018.2867812","journal-title":"IEEE Trans. Consum. Electron."},{"key":"1300_CR16","doi-asserted-by":"publisher","DOI":"10.1109\/SAMOS.2015.7363667","author":"DF de Souza","year":"2015","unstructured":"de Souza, D.F., Ilic, A., Roma, N., Sousa, L.: HEVC in-loop filters GPU parallelization in embedded systems. Int. Conf. Embed. Comput. Syst. (2015). https:\/\/doi.org\/10.1109\/SAMOS.2015.7363667","journal-title":"Int. Conf. Embed. Comput. Syst."},{"issue":"2","key":"1300_CR17","doi-asserted-by":"publisher","first-page":"531","DOI":"10.1007\/s11554-015-0519-1","volume":"12","author":"DF de Souza","year":"2016","unstructured":"de Souza, D.F., Ilic, A., Roma, N., Sousa, L.: GPU-assisted HEVC intra decoder. J. Real-Time Image Proc. 12(2), 531\u2013547 (2016). https:\/\/doi.org\/10.1007\/s11554-015-0519-1","journal-title":"J. Real-Time Image Proc."},{"key":"1300_CR18","doi-asserted-by":"publisher","first-page":"323","DOI":"10.1109\/ICIST.2017.7926778","volume":"2017","author":"A Ma","year":"2017","unstructured":"Ma, A., Guo, C.: Parallel acceleration of HEVC decoder based on CPU+GPU heterogeneous platform. Seventh Int. Conf. Inf. Sci. Technol. (ICIST) 2017, 323\u2013330 (2017). https:\/\/doi.org\/10.1109\/ICIST.2017.7926778","journal-title":"Seventh Int. Conf. Inf. Sci. Technol. (ICIST)"},{"key":"1300_CR19","doi-asserted-by":"publisher","first-page":"181","DOI":"10.1109\/ICIST.2016.7483407","volume":"2016","author":"W Zhang","year":"2016","unstructured":"Zhang, W., Guo, C.: Design and implementation of parallel algorithms for sample adaptive offset in HEVC based on GPU. Sixth Int. Conf. Inf. Sci. Technol. (ICIST) 2016, 181\u2013187 (2016). https:\/\/doi.org\/10.1109\/ICIST.2016.7483407","journal-title":"Sixth Int. Conf. Inf. Sci. Technol. (ICIST)"},{"key":"1300_CR20","doi-asserted-by":"crossref","unstructured":"Ma, S., Huang, T., Wen, G.: The second generation IEEE, video coding standard. In: IEEE China Summit and International Conferece on Signal and Information Processing, p. 2015 (1857)","DOI":"10.1109\/ChinaSIP.2015.7230385"},{"key":"1300_CR21","doi-asserted-by":"publisher","DOI":"10.1109\/MIPR49039.2020.00061","author":"B Jiang","year":"2020","unstructured":"Jiang, B., Xu, H., Luo, F., Wang, S., Ma, S., Gao, W.: GPU-based intra decompression for 8K real-time AVS3 decoder. IEEE Conf. Multimed. Inf. Process. Retr. (MIPR) (2020). https:\/\/doi.org\/10.1109\/MIPR49039.2020.00061","journal-title":"IEEE Conf. Multimed. Inf. Process. Retr. (MIPR)"},{"key":"1300_CR22","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/ICMEW46912.2020.9106009","volume":"2020","author":"X Han","year":"2020","unstructured":"Han, X., et al.: GPU based Real-Time UHD Intra Decoding for AVS3. IEEE Int. Conf. Multimed. Expo Worksh. (ICMEW) 2020, 1\u20136 (2020). https:\/\/doi.org\/10.1109\/ICMEW46912.2020.9106009","journal-title":"IEEE Int. Conf. Multimed. Expo Worksh. (ICMEW)"},{"key":"1300_CR23","unstructured":"Jiaqi, Z., Chuanmin, J., Meng, L., Shanshe, W., Siwei, M., Wen, J.: Gao. Recent development of AVS video coding standard : Avs3. In: 2019 Picture Coding Symposium (PCS), IEEE, pp. 311\u2013315 (2019)"},{"key":"1300_CR24","doi-asserted-by":"publisher","first-page":"65361","DOI":"10.1109\/ACCESS.2021.3075875","volume":"9","author":"D Karwowski","year":"2021","unstructured":"Karwowski, D.: Precise probability estimation of symbols in VVC CABAC entropy encoder. IEEE Access 9, 65361\u201365368 (2021). https:\/\/doi.org\/10.1109\/ACCESS.2021.3075875","journal-title":"IEEE Access"},{"issue":"10","key":"1300_CR25","doi-asserted-by":"publisher","first-page":"3907","DOI":"10.1109\/TCSVT.2021.3072297","volume":"31","author":"M Karczewicz","year":"2021","unstructured":"Karczewicz, M., et al.: VVC in-loop filters. IEEE Trans. Circuits Syst. Video Technol. 31(10), 3907\u20133925 (2021). https:\/\/doi.org\/10.1109\/TCSVT.2021.3072297","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"issue":"6","key":"1300_CR26","doi-asserted-by":"publisher","first-page":"934","DOI":"10.1109\/JSTSP.2013.2271974","volume":"7","author":"C-Y Tsai","year":"2013","unstructured":"Tsai, C.-Y., et al.: Adaptive loop filtering for video coding. IEEE J. Sel. Top. Signal Process. 7(6), 934\u2013945 (2013). https:\/\/doi.org\/10.1109\/JSTSP.2013.2271974","journal-title":"IEEE J. Sel. Top. Signal Process."},{"key":"1300_CR27","doi-asserted-by":"publisher","first-page":"28","DOI":"10.1017\/ATSIP.2019.19","volume":"8","author":"J Erfurt","year":"2019","unstructured":"Erfurt, J., et al.: Extended multiple feature-based classifications for adaptive loop filtering. APSIPA Trans. Signal Inf. Process. 8, 28 (2019). https:\/\/doi.org\/10.1017\/ATSIP.2019.19","journal-title":"APSIPA Trans. Signal Inf. Process."},{"key":"1300_CR28","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/ASICON52560.2021.9620332","volume":"2021","author":"X Wang","year":"2021","unstructured":"Wang, X., Sun, H., Katto, J., Fan, Y.: A hardware architecture for adaptive loop filter in VVC decoder. IEEE 14 Int. Conf. ASIC (ASICON) 2021, 1\u20134 (2021). https:\/\/doi.org\/10.1109\/ASICON52560.2021.9620332","journal-title":"IEEE 14 Int. Conf. ASIC (ASICON)"},{"key":"1300_CR29","unstructured":"Fraunhofer HHI VVdeC Software Repository. https:\/\/github.com\/fraunhoferhhi\/vvdec (2022). Accessed 02 July 2022"},{"key":"1300_CR30","unstructured":"Ffmpeg.: A complete, cross-platform solution to record, convert and stream audio and video. https:\/\/ffmpeg.org\/ (2022). Accessed 22 Aug 2022"},{"key":"1300_CR31","unstructured":"GPAC: Multimedia Open Source Project. https:\/\/gpac.wp.imt.fr\/ (2022). Accessed 22 Aug 2022"},{"key":"1300_CR32","doi-asserted-by":"publisher","DOI":"10.1109\/TCE.2022.3202512","author":"A Saha","year":"2022","unstructured":"Saha, A., Chavarr\u00edas, M., Aranda, V., Garrido, M.J., Pescador, F.: Implementation of a real-time versatile video coding decoder based on VVdeC over an embedded multi-core platform. IEEE Trans. Consum. Electron. (2022). https:\/\/doi.org\/10.1109\/TCE.2022.3202512","journal-title":"IEEE Trans. Consum. Electron."},{"key":"1300_CR33","unstructured":"Fraunhofer HHI VVdeC software repository, Releases vvdec-0.2.0.0. https:\/\/github.com\/fraunhoferhhi\/vvdec\/releases\/tag\/v0.2.0.0 (2022). Accessed 27 Apr 2022"},{"key":"1300_CR34","unstructured":"Saha, A.: VVdeC2_ARM_Neon. https:\/\/github.com\/Sahamec\/VVdeC2_ARM_Neon (2022). Accessed 19 May 2022"},{"key":"1300_CR35","doi-asserted-by":"publisher","DOI":"10.1109\/ICICCT.2017.7975190","author":"NV Sunitha","year":"2017","unstructured":"Sunitha, N.V., Raju, K., Chiplunkar, N.N.: Performance improvement of CUDA applications by reducing CPU-GPU data transfer overhead. Int. Conf. Invent. Commun. Comput. Technol. (ICICCT) (2017). https:\/\/doi.org\/10.1109\/ICICCT.2017.7975190","journal-title":"Int. Conf. Invent. Commun. Comput. Technol. (ICICCT)"},{"key":"1300_CR36","unstructured":"Ponnuraj, R.P.: CUDA memory model. https:\/\/medium.com\/analytics-vidhya\/cuda-memory-model-823f02cef0bf (2022). Accessed 12 Aug 2022"},{"key":"1300_CR37","unstructured":"NVIDIA Jetson AGX Xavier Developer Kit, User Guide. DA_09403_003, December 17, 2019. https:\/\/developer.nvidia.com\/jetson-agx-xavier-developer-kit-user-guide (2022). Accessed 06 July 2022"},{"key":"1300_CR38","unstructured":"Bossen, F., Boyce, J., Li, X., Seregin, V., S\u00fchring, K.: JVET common test conditions and software reference configurations for SDR Video, Document JVET-N1010. JVET of ITU-T, Geneva (2019)"}],"container-title":["Journal of Real-Time Image Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-023-01300-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11554-023-01300-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11554-023-01300-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,6,3]],"date-time":"2023-06-03T07:16:38Z","timestamp":1685776598000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11554-023-01300-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,4,13]]},"references-count":38,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2023,6]]}},"alternative-id":["1300"],"URL":"https:\/\/doi.org\/10.1007\/s11554-023-01300-z","relation":{"has-preprint":[{"id-type":"doi","id":"10.21203\/rs.3.rs-2381512\/v1","asserted-by":"object"}]},"ISSN":["1861-8200","1861-8219"],"issn-type":[{"value":"1861-8200","type":"print"},{"value":"1861-8219","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,4,13]]},"assertion":[{"value":"15 December 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 March 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 April 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"43"}}