{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,12]],"date-time":"2026-05-12T21:02:27Z","timestamp":1778619747169,"version":"3.51.4"},"reference-count":43,"publisher":"Springer Science and Business Media LLC","issue":"41","license":[{"start":{"date-parts":[[2025,8,26]],"date-time":"2025-08-26T00:00:00Z","timestamp":1756166400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,8,26]],"date-time":"2025-08-26T00:00:00Z","timestamp":1756166400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-025-21084-7","type":"journal-article","created":{"date-parts":[[2025,8,26]],"date-time":"2025-08-26T08:42:40Z","timestamp":1756197760000},"page":"49197-49217","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["A hybrid CNN-transformer architecture for adult image and video content recognition on the internet"],"prefix":"10.1007","volume":"84","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-9445-8044","authenticated-orcid":false,"given":"Sasan","family":"Karamizadeh","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mahdi","family":"Pourmirzaei","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mazdak","family":"Zamani","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Achyut","family":"Shankar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,8,26]]},"reference":[{"issue":"1","key":"21084_CR1","doi-asserted-by":"publisher","first-page":"4","DOI":"10.3390\/sym13010004","volume":"13","author":"M Mulyanto","year":"2020","unstructured":"Mulyanto M, Faisal M, Prakosa SW, Leu JS (2020) Effectiveness of focal loss for minority classification in network intrusion detection systems. Symmetry 13(1):4","journal-title":"Symmetry"},{"key":"21084_CR2","doi-asserted-by":"crossref","unstructured":"Huynh VN, Nguyen HH (2021) Fast pornographic video detection using deep learning. In 2021 RIVF international conference on computing and ommunication technologies (RIVF) (pp. 1\u20136). IEEE","DOI":"10.1109\/RIVF51545.2021.9642154"},{"key":"21084_CR3","doi-asserted-by":"publisher","first-page":"123977","DOI":"10.1109\/ACCESS.2021.3109102","volume":"9","author":"H Yuan","year":"2021","unstructured":"Yuan H, Cai Z, Zhou H, Wang Y, Chen X (2021) Transanomaly: video anomaly detection using video vision transformer. IEEE Access 9:123977\u2013123986","journal-title":"IEEE Access"},{"key":"21084_CR4","doi-asserted-by":"crossref","unstructured":"Wang Q, Yuan Z, Du Q, Li X (2019) GETNET: a general end-to-end two-dimensional CNN framework for hyperspectral image change detection. CoRR abs\/1905.01662.","DOI":"10.1109\/TGRS.2018.2849692"},{"key":"21084_CR5","doi-asserted-by":"crossref","unstructured":"Gangwar A, Fidalgo E, Alegre E, Gonz\u00e1lez-Castro V (2017) Pornography and child sexual abuse detection in image and video: a comparative evaluation","DOI":"10.1049\/ic.2017.0046"},{"issue":"6","key":"21084_CR6","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/3065386","volume":"60","author":"A Krizhevsky","year":"2017","unstructured":"Krizhevsky A, Sutskever I, Hinton GE (2017) Imagenet classification with deep convolutional neural networks. Commun ACM 60(6):84\u201390","journal-title":"Commun ACM"},{"key":"21084_CR7","doi-asserted-by":"crossref","unstructured":"Kumar GR, Kumar RK, Sanyal G (2017)\u00a0Discriminating real from fake smile using convolution neural network. In 2017 International Conference on Computational Intelligence in Data Science (ICCIDS) (pp. 1\u20136). IEEE","DOI":"10.1109\/ICCIDS.2017.8272651"},{"key":"21084_CR8","doi-asserted-by":"crossref","unstructured":"Tarasiewicz T, Nalepa J, Kawulok M (2020) Skinny: a lightweight U-net for skin detection and segmentation. In 2020 IEEE International Conference on Image Processing (ICIP) (pp. 2386\u20132390). IEEE","DOI":"10.1109\/ICIP40778.2020.9191209"},{"issue":"3","key":"21084_CR9","doi-asserted-by":"publisher","first-page":"202","DOI":"10.1504\/IJEF.2019.099045","volume":"9","author":"A Moradi","year":"2019","unstructured":"Moradi A, Alizadeh M, Samadi M, Yusof R (2019) Understanding the characteristicsof financial time series through neural network and SVM approaches. Int J Electron Finance 9(3):202\u2013216","journal-title":"Int J Electron Finance"},{"key":"21084_CR10","doi-asserted-by":"crossref","unstructured":"Yan H (2020) Detect and depornize pornographic images using pre-trained CNN Models. In 2020 International Conference on Computing and Data Science (CDS) (pp. 48\u201351). IEEE","DOI":"10.1109\/CDS49703.2020.00017"},{"issue":"1","key":"21084_CR11","doi-asserted-by":"publisher","first-page":"81","DOI":"10.1023\/A:1013200319198","volume":"46","author":"MJ Jones","year":"2002","unstructured":"Jones MJ, Rehg JM (2002) Statistical color models with application to skin detection. Int J Comput Vis 46(1):81\u201396","journal-title":"Int J Comput Vis"},{"key":"21084_CR12","first-page":"2999","volume":"39","author":"P Goyal","year":"2018","unstructured":"Goyal P, Kaiming H (2018) Focal loss for dense object detection. IEEE Trans Pattern Anal Mach Intell 39:2999\u20133007","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"21084_CR13","doi-asserted-by":"crossref","unstructured":"Lin TY, Goyal P, Girshick R, He K, Doll\u00e1r P (2017) Focal loss for dense object detection. In Proceedings of the IEEE international conference on computer vision (pp. 2980\u20132988)","DOI":"10.1109\/ICCV.2017.324"},{"key":"21084_CR14","doi-asserted-by":"crossref","unstructured":"Wazir ASB, Karim HA, Abdullah MHL, Mansor S (2019) Acoustic pornography recognition using recurrent neural network. In 2019 IEEE International Conference on Signal and Image Processing Applications (ICSIPA) (pp. 144\u2013148). IEEE","DOI":"10.1109\/ICSIPA45851.2019.8977794"},{"key":"21084_CR15","doi-asserted-by":"crossref","unstructured":"Jiu M, Sahbi H (2020) Image annotation based on deep hierarchical context networks. arXiv preprint arXiv:2012.11253","DOI":"10.1109\/ICASSP39728.2021.9413972"},{"key":"21084_CR16","doi-asserted-by":"crossref","unstructured":"Wiratama MR, Endah SN, Kusumaningrum R, Wibawa HA (2017) Pornography object detection using Viola-Jones algorithm and skin detection. In 2017 1st International Conference on Informatics and Computational Sciences (ICICoS) (pp. 29\u201334). IEEE","DOI":"10.1109\/ICICOS.2017.8276333"},{"key":"21084_CR17","doi-asserted-by":"publisher","first-page":"102","DOI":"10.1016\/j.neucom.2016.03.099","volume":"213","author":"C Caetano","year":"2016","unstructured":"Caetano C, Avila S, Schwartz WR, Guimar\u00e3es SJF, Ara\u00fajo AdA (2016) A mid- level video representation based on binary descriptors: a case study for pornography detection. Neurocomputing 213:102\u2013114","journal-title":"Neurocomputing"},{"issue":"2","key":"21084_CR18","doi-asserted-by":"publisher","first-page":"1041","DOI":"10.1007\/s10462-018-9664-9","volume":"52","author":"S Naji","year":"2019","unstructured":"Naji S, Jalab HA, Kareem SA (2019) A survey on skin detection in colored images. Artif Intell Rev 52(2):1041\u20131087","journal-title":"Artif Intell Rev"},{"issue":"6","key":"21084_CR19","doi-asserted-by":"publisher","first-page":"900","DOI":"10.1038\/s41591-020-0842-3","volume":"26","author":"Y Liu","year":"2020","unstructured":"Liu Y, Jain A, Eng C, Way DH, Lee K, Bui P, Coz D (2020) A deep learning system for differential diagnosis of skin diseases. Nat Med 26(6):900\u2013908","journal-title":"Nat Med"},{"key":"21084_CR20","doi-asserted-by":"publisher","first-page":"55","DOI":"10.1016\/j.neucom.2017.06.082","volume":"276","author":"S Nejatian","year":"2018","unstructured":"Nejatian S, Parvin H, Faraji E (2018) Using sub-sampling and ensemble clustering techniques to improve performance of imbalanced classification. Neurocomputing 276:55\u201366","journal-title":"Neurocomputing"},{"key":"21084_CR21","doi-asserted-by":"publisher","first-page":"307","DOI":"10.1016\/j.inffus.2018.03.001","volume":"45","author":"D Moreira","year":"2019","unstructured":"Moreira D, Avila S, Perez M, Moraes D, Testoni V, Valle E, Rocha A (2019) Multimodal data fusion for sensitive scene localization. Inf Fusion 45:307\u2013323","journal-title":"Inf Fusion"},{"issue":"1","key":"21084_CR22","doi-asserted-by":"publisher","first-page":"169","DOI":"10.1007\/s11063-020-10238-3","volume":"52","author":"W Xu","year":"2020","unstructured":"Xu W, Parvin H, Izadparast H (2020) Deep learning neural network for unconventional images classification. Neural Process Lett 52(1):169\u2013185","journal-title":"Neural Process Lett"},{"key":"21084_CR23","doi-asserted-by":"crossref","unstructured":"Karamizadeh S, Shojae Chaeikar S, Jolfaei A (2022) Adult content image recognition by boltzmann machine limited and deep learning. Evol Intell 1\u201310","DOI":"10.1007\/s12065-022-00729-8"},{"key":"21084_CR24","doi-asserted-by":"crossref","unstructured":"Lin G, Shen C, Van Den Hengel A, Reid I, Efficient piecewise training of deep structured models for semantic segmentation\u2019, in Editor (Ed.)^(Eds.): \u2018Book Efficient piecewise training of deep structured models for semantic segmentation\u2019 (2016, edn.), pp.3194\u20133203","DOI":"10.1109\/CVPR.2016.348"},{"key":"21084_CR25","doi-asserted-by":"crossref","unstructured":"Huang L, Ren X (2018) Erotic image recognition method of bagging integrated convolutional neural network. In Proceedings of the 2nd International Conference on Computer Science and Application Engineering (pp. 1\u20137)","DOI":"10.1145\/3207677.3277990"},{"key":"21084_CR26","doi-asserted-by":"publisher","first-page":"49925","DOI":"10.1109\/ACCESS.2018.2868813","volume":"6","author":"L Yuan","year":"2018","unstructured":"Yuan L, Wei X, Shen H, Zeng LL, Hu D (2018) Multi-center brain imaging classification using a novel 3D CNN approach. IEEE Access 6:49925\u201349934","journal-title":"IEEE Access"},{"key":"21084_CR27","doi-asserted-by":"crossref","unstructured":"Tabone A, Camilleri K, Bonnici A, Cristina S, Farrugia R, Borg M (2021) Pornographic content classification using deep-learning. In Proceedings of the 21st ACM Symposium on Document Engineering (pp. 1\u201310)","DOI":"10.1145\/3469096.3469867"},{"key":"21084_CR28","doi-asserted-by":"publisher","DOI":"10.1016\/j.cmpb.2021.106586","volume":"214","author":"J Zhang","year":"2022","unstructured":"Zhang J, Li C, Liu G, Min M, Wang C, Li J, Chen H (2022) A CNN-transformer hybrid approach for decoding visual neural activity into text. Comput Methods Programs Biomed 214:106586","journal-title":"Comput Methods Programs Biomed"},{"key":"21084_CR29","doi-asserted-by":"publisher","first-page":"81","DOI":"10.1016\/j.neucom.2021.02.056","volume":"445","author":"A Gangwar","year":"2021","unstructured":"Gangwar A, Gonz\u00e1lez-Castro V, Alegre E, Fidalgo E (2021) AttM-CNN: attention and metric learning based CNN for pornography, age and child sexual abuse (CSA) detection in images. Neurocomputing 445:81\u2013104","journal-title":"Neurocomputing"},{"issue":"7","key":"21084_CR30","doi-asserted-by":"publisher","first-page":"4367","DOI":"10.1007\/s10489-020-02116-1","volume":"51","author":"Y Chen","year":"2021","unstructured":"Chen Y, Liu L, Phonevilay V, Gu K, Xia R, Xie J, Yang K (2021) Image super-resolution reconstruction based on feature map attention mechanism. Appl Intell 51(7):4367\u20134380","journal-title":"Appl Intell"},{"key":"21084_CR31","doi-asserted-by":"publisher","first-page":"46","DOI":"10.1016\/j.forsciint.2016.09.010","volume":"268","author":"D Moreira","year":"2016","unstructured":"Moreira D, Avila S, Perez M, Moraes D, Testoni V, Valle E, Rocha A (2016) Pornography classification: the hidden clues in video space\u2013time. Forensic Sci Int 268:46\u201361","journal-title":"Forensic Sci Int"},{"key":"21084_CR32","doi-asserted-by":"publisher","first-page":"122709","DOI":"10.1109\/ACCESS.2020.2988736","volume":"8","author":"J Chen","year":"2020","unstructured":"Chen J, Liang G, He W, Xu C, Yang J, Liu R (2020) A pornographic images recognition model based on deep one-class classification with visual attention mechanism. IEEE Access 8:122709\u2013122721","journal-title":"IEEE Access"},{"issue":"1","key":"21084_CR33","doi-asserted-by":"publisher","first-page":"26","DOI":"10.3390\/sym13010026","volume":"13","author":"N AlDahoul","year":"2020","unstructured":"AlDahoul N, Karim A, Lye Abdullah H, Fauzi MHA, Wazir MFB, Mansor AS, S., See J (2020) Transfer detection of YOLO to focus cnn\u2019s attention on nude regions for adult content detection. Symmetry 13(1):26","journal-title":"Symmetry"},{"key":"21084_CR34","doi-asserted-by":"publisher","first-page":"432","DOI":"10.1016\/j.neucom.2017.07.012","volume":"272","author":"J Wehrmann","year":"2018","unstructured":"Wehrmann J, Sim\u00f5es GS, Barros RC, Cavalcante VF (2018) Adult content detection in videos with convolutional and recurrent neural networks. Neurocomputing 272:432\u2013438","journal-title":"Neurocomputing"},{"issue":"3","key":"21084_CR35","first-page":"1481","volume":"25","author":"DD Phan","year":"2022","unstructured":"Phan DD, Nguyen QH, Nguyen TT, Tran HL, Vu DL (2022) Joint inter-intra representation learning for pornographic video classification. Indones J Electr Eng Comput Sci 25(3):1481\u20131488","journal-title":"Indones J Electr Eng Comput Sci"},{"key":"21084_CR36","doi-asserted-by":"crossref","unstructured":"AlDahoul N, Karim HA, Wazir ASB, Momo MA, Abdullah MHL (2021)\u00a0A comparative study of in-domain vs cross-domain learning for porn cartoon classification. In 2021 IEEE International Conference on Signal and Image Processing Applications (ICSIPA) (pp. 60\u201365). IEEE","DOI":"10.1109\/ICSIPA52582.2021.9576769"},{"issue":"4","key":"21084_CR37","doi-asserted-by":"publisher","DOI":"10.3390\/diagnostics13040686","volume":"13","author":"S Fekri-Ershad","year":"2023","unstructured":"Fekri-Ershad S, Alsaffar MF (2023) Developing a tuned three-layer perceptron fed with trained deep convolutional neural networks for cervical cancer diagnosis. Diagnostics 13(4):686","journal-title":"Diagnostics"},{"key":"21084_CR38","unstructured":"Moustafa M (2015) Applying deep learning to classify pornographic images and videos. ArXiv Preprint arXiv :151108899"},{"key":"21084_CR39","doi-asserted-by":"crossref","unstructured":"Shah U, Aqmar M, Nakazawa M, Stenger B (2021) Content filtering in streaming video using domain adaptation. In 2021 17th International Conference on Machine Vision and Applications (MVA) (pp. 1\u20136). IEEE","DOI":"10.23919\/MVA51890.2021.9511364"},{"key":"21084_CR40","doi-asserted-by":"crossref","unstructured":"Lu Z, Li J, Liu H, Huang C, Zhang L, Zeng T (2022)\u00a0Transformer for single image super-resolution. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (pp. 457\u2013466)","DOI":"10.1109\/CVPRW56347.2022.00061"},{"key":"21084_CR41","doi-asserted-by":"crossref","unstructured":"Liu Z, Hu H, Lin Y, Yao Z, Xie Z, Wei Y, ... Guo B (2022) Swin transformer v2: Scaling up capacity and resolution. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (pp. 12009\u201312019)","DOI":"10.1109\/CVPR52688.2022.01170"},{"issue":"1","key":"21084_CR42","doi-asserted-by":"publisher","first-page":"73","DOI":"10.1007\/s13042-020-01157-9","volume":"12","author":"X Lin","year":"2021","unstructured":"Lin X, Qin F, Peng Y, Shao Y (2021) Fine-grained pornographic image recognition with multiple feature fusion transfer learning. Int J Mach Learn Cybernet 12(1):73\u201386","journal-title":"Int J Mach Learn Cybernet"},{"issue":"19","key":"21084_CR43","doi-asserted-by":"publisher","first-page":"28739","DOI":"10.1007\/s11042-023-14437-7","volume":"82","author":"S Samal","year":"2023","unstructured":"Samal S, Nayak R, Jena S, Balabantaray BK (2023) Obscene image detection using transfer learning and feature fusion. Multimedia Tools Appl 82(19):28739\u201328767","journal-title":"Multimedia Tools Appl"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-025-21084-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-025-21084-7","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-025-21084-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,25]],"date-time":"2025-12-25T15:23:12Z","timestamp":1766676192000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-025-21084-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,26]]},"references-count":43,"journal-issue":{"issue":"41","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["21084"],"URL":"https:\/\/doi.org\/10.1007\/s11042-025-21084-7","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,8,26]]},"assertion":[{"value":"20 August 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 April 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 July 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 August 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}