{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,8]],"date-time":"2026-04-08T16:33:05Z","timestamp":1775665985073,"version":"3.50.1"},"reference-count":88,"publisher":"Springer Science and Business Media LLC","issue":"12","license":[{"start":{"date-parts":[[2023,5,17]],"date-time":"2023-05-17T00:00:00Z","timestamp":1684281600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,5,17]],"date-time":"2023-05-17T00:00:00Z","timestamp":1684281600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-023-15774-3","type":"journal-article","created":{"date-parts":[[2023,5,17]],"date-time":"2023-05-17T08:04:35Z","timestamp":1684310675000},"page":"36519-36546","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Using two-stream EfficientNet-BiLSTM network for multiclass classification of disturbing YouTube videos"],"prefix":"10.1007","volume":"83","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2198-6932","authenticated-orcid":false,"given":"Kanwal","family":"Yousaf","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tabassam","family":"Nawaz","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Adnan","family":"Habib","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,5,17]]},"reference":[{"key":"15774_CR1","unstructured":"Abadi M, Barham P, Chen J, Chen Z, Davis A, Dean J, Devin M, Ghemawat S, Irving G, Isard M (2016) Tensorflow: a system for large-scale machine learning. In: 12th USENIX symposium on operating systems design and implementation (OSDI' 16).\u00a0USENIX, pp 265\u2013283. Available at: https:\/\/www.usenix.org\/system\/files\/conference\/osdi16\/osdi16-abadi.pdf"},{"key":"15774_CR2","unstructured":"Abu-El-Haija S, Kothari N, Lee J, Natsev P, Toderici G, Varadarajan B, Vijayanarasimhan S (2016) Youtube-8m: a large-scale video classification benchmark. arXiv preprint arXiv:1609.08675. Available at: https:\/\/arxiv.org\/abs\/1609.08675"},{"key":"15774_CR3","doi-asserted-by":"publisher","first-page":"39910","DOI":"10.1109\/ACCESS.2021.3064392","volume":"9","author":"N Aldahoul","year":"2021","unstructured":"Aldahoul N, Karim HA, Abdullah MHL, Wazir ASB, Fauzi MFA, Tan MJT, Mansor S, Lyn HS (2021) An evaluation of traditional and CNN-based feature descriptors for cartoon pornography detection. IEEE Access 9:39910\u201339925. https:\/\/doi.org\/10.1109\/ACCESS.2021.3064392","journal-title":"IEEE Access"},{"key":"15774_CR4","doi-asserted-by":"publisher","unstructured":"Alghowinem S (2018) A safer youtube kids: an extra layer of content filtering using automated multimodal analysis. In: Proceedings of SAI Intelligent Systems Conference. Springer, pp. 294\u2013308. https:\/\/doi.org\/10.1007\/978-3-030-01054-6_21","DOI":"10.1007\/978-3-030-01054-6_21"},{"key":"15774_CR5","doi-asserted-by":"publisher","unstructured":"Ali A, Senan N (2018) Violence video classification performance using deep neural networks. In: International conference on soft computing and data mining. Springer, pp. 225\u2013233. https:\/\/doi.org\/10.1007\/978-3-319-72550-5_22","DOI":"10.1007\/978-3-319-72550-5_22"},{"key":"15774_CR6","doi-asserted-by":"publisher","first-page":"508","DOI":"10.1145\/3442442.3452314","volume":"2021","author":"S Alshamrani","year":"2021","unstructured":"Alshamrani S, Abusnaina A, Abuhamad M, Nyang D, Mohaisen D (2021) Hate, obscenity, and insults: measuring the exposure of children to inappropriate comments in YouTube. Companion Proceedings of the Web Conference 2021:508\u2013515. https:\/\/doi.org\/10.1145\/3442442.3452314","journal-title":"Companion Proceedings of the Web Conference"},{"key":"15774_CR7","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1080\/15456870.2015.972404","volume":"23","author":"Y Ariel","year":"2015","unstructured":"Ariel Y, Avidar R (2015) Information, interactivity, and social media. Atlantic J Commun 23:19\u201330. https:\/\/doi.org\/10.1080\/15456870.2015.972404","journal-title":"Atlantic J Commun"},{"key":"15774_CR8","unstructured":"Brandom R (2017) Inside elsagate, the conspiracy fueled war on creepy youtube kids videos. The Verge. www.theverge.com\/2017\/12\/8\/16751206\/elsagate-youtube-kids-creepy-conspiracy-theory. Accessed\u00a010 Sep 2021"},{"key":"15774_CR9","doi-asserted-by":"publisher","first-page":"205630511770718","DOI":"10.1177\/2056305117707189","volume":"3","author":"B Burroughs","year":"2017","unstructured":"Burroughs B (2017) YouTube kids: the app economy and mobile parenting. Soc Med Soc 3:2056305117707189. https:\/\/doi.org\/10.1177\/2056305117707189","journal-title":"Soc Med Soc"},{"key":"15774_CR10","doi-asserted-by":"publisher","first-page":"348","DOI":"10.1001\/archpedi.160.4.348","volume":"160","author":"BJ Bushman","year":"2006","unstructured":"Bushman BJ, Huesmann LR (2006) Short-term and long-term effects of violent media on aggression in children and adults. Arch Pediatr Adolesc Med 160:348\u2013352. https:\/\/doi.org\/10.1001\/archpedi.160.4.348","journal-title":"Arch Pediatr Adolesc Med"},{"key":"15774_CR11","unstructured":"Caetano C, Avila S, Guimaraes S, Ara\u00fajo ADA (2014) Pornography detection using bossanova video descriptor. In: 2014 22nd European signal processing conference (EUSIPCO). IEEE, pp 1681\u20131685. Available at: https:\/\/ieeexplore.ieee.org\/document\/6952616"},{"key":"15774_CR12","unstructured":"Ceci L (2021) Global number of YouTube viewers 2016\u20132021. https:\/\/www.statista.com\/statistics\/805656\/number-youtube-viewers-worldwide\/. Accessed 1 Nov 2021"},{"key":"15774_CR13","unstructured":"Ceci L (2021) YouTube - Statistics & Facts. https:\/\/www.statista.com\/topics\/2019\/youtube\/. Accessed\u00a01 Sep 2021"},{"key":"15774_CR14","doi-asserted-by":"publisher","first-page":"77","DOI":"10.1177\/1329878X17693700","volume":"163","author":"D Craig","year":"2017","unstructured":"Craig D, Cunningham S (2017) Toy unboxing: living in a (n unregulated) material world. Med Int Aust 163:77\u201386. https:\/\/doi.org\/10.1177\/1329878X17693700","journal-title":"Med Int Aust"},{"key":"15774_CR15","doi-asserted-by":"publisher","unstructured":"Dadvar M, Eckert K (2020) Cyberbullying detection in social networks using deep learning based models. In: International conference on big data analytics and knowledge discovery. Springer, pp. 245\u2013255. https:\/\/doi.org\/10.1201\/9781003134527-11","DOI":"10.1201\/9781003134527-11"},{"key":"15774_CR16","unstructured":"Defendant's opposition WDI (2018) The YouTube service and terms of use. https:\/\/digitalcommons.law.scu.edu\/cgi\/viewcontent.cgi?article=2680&context=historical. Accessed 22 Dec 2021"},{"key":"15774_CR17","doi-asserted-by":"publisher","unstructured":"Deng J, Dong W, Socher R, Li L-J, Li K, Fei-Fei L (2009) Imagenet: A large-scale hierarchical image database. In: 2009 IEEE conference on computer vision and pattern recognition. IEEE, pp 248\u2013255. https:\/\/doi.org\/10.1109\/cvprw.2009.5206848","DOI":"10.1109\/cvprw.2009.5206848"},{"key":"15774_CR18","doi-asserted-by":"publisher","unstructured":"Deselaers T, Pimenidis L, Ney H (2008) Bag-of-visual-words models for adult image classification and filtering. In: 2008 19th International Conference on Pattern Recognition. IEEE, pp 1\u20134. https:\/\/doi.org\/10.1109\/ICPR.2008.4761366","DOI":"10.1109\/ICPR.2008.4761366"},{"key":"15774_CR19","doi-asserted-by":"publisher","unstructured":"Ding C, Fan S, Zhu M, Feng W, Jia B (2014) Violence detection in video by using 3D convolutional neural networks. In: International Symposium on Visual Computing (ISVC 2014). Springer, pp 551\u2013558. https:\/\/doi.org\/10.1007\/978-3-319-14364-4_53","DOI":"10.1007\/978-3-319-14364-4_53"},{"key":"15774_CR20","doi-asserted-by":"publisher","unstructured":"Elias N and Sulkin I (2017) YouTube viewers in diapers: an exploration of factors associated with amount of toddlers\u2019 online viewing. Cyberpsych J Psychosoc Res Cyberspace 11. https:\/\/doi.org\/10.5817\/cp2017-3-2","DOI":"10.5817\/cp2017-3-2"},{"key":"15774_CR21","doi-asserted-by":"publisher","unstructured":"Farneb\u00e4ck G (2003) Two-frame motion estimation based on polynomial expansion. In: Scandinavian conference on Image analysis. Springer,\u00a0Berlin, Heidelberg, pp 363\u2013370. https:\/\/doi.org\/10.1007\/3-540-45103-X_50","DOI":"10.1007\/3-540-45103-X_50"},{"key":"15774_CR22","doi-asserted-by":"publisher","first-page":"88","DOI":"10.1016\/j.chb.2017.10.041","volume":"80","author":"A Ferchaud","year":"2018","unstructured":"Ferchaud A, Grzeslo J, Orme S, LaGroue J (2018) Parasocial attributes and YouTube personalities: exploring content trends across the most subscribed YouTube channels. Comput Hum Behav 80:88\u201396. https:\/\/doi.org\/10.1016\/j.chb.2017.10.041","journal-title":"Comput Hum Behav"},{"key":"15774_CR23","doi-asserted-by":"publisher","unstructured":"Fleck MM, Forsyth DA, Bregler C (1996) Finding naked people. In: European conference on computer vision. Springer,\u00a0Berlin, Heidelberg, pp 593\u2013602. https:\/\/doi.org\/10.1007\/3-540-61123-1_173","DOI":"10.1007\/3-540-61123-1_173"},{"key":"15774_CR24","doi-asserted-by":"publisher","first-page":"63","DOI":"10.1023\/A:1008145029462","volume":"32","author":"DA Forsyth","year":"1999","unstructured":"Forsyth DA, Fleck MM (1999) Automatic detection of human nudes. Int J Comput Vis 32:63\u201377. https:\/\/doi.org\/10.1023\/A:1008145029462","journal-title":"Int J Comput Vis"},{"key":"15774_CR25","doi-asserted-by":"publisher","unstructured":"Forsyth DA, Fleck MM (1997) Body plans. In: Proceedings of IEEE computer society conference on computer vision and pattern recognition. IEEE, pp 678\u2013683. https:\/\/doi.org\/10.1109\/CVPR.1997.609399","DOI":"10.1109\/CVPR.1997.609399"},{"key":"15774_CR26","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1016\/j.imavis.2016.01.006","volume":"48","author":"Y Gao","year":"2016","unstructured":"Gao Y, Liu H, Sun X, Wang C, Liu Y (2016) Violence detection using oriented violent flows. Image Vis Comput 48:37\u201341. https:\/\/doi.org\/10.1016\/j.imavis.2016.01.006","journal-title":"Image Vis Comput"},{"key":"15774_CR27","doi-asserted-by":"publisher","first-page":"602","DOI":"10.1016\/j.neunet.2005.06.042","volume":"18","author":"A Graves","year":"2005","unstructured":"Graves A, Schmidhuber J (2005) Framewise phoneme classification with bidirectional LSTM and other neural network architectures. Neural Netw 18:602\u2013610. https:\/\/doi.org\/10.1016\/j.neunet.2005.06.042","journal-title":"Neural Netw"},{"key":"15774_CR28","doi-asserted-by":"publisher","unstructured":"Hanson A, Pnvr K, Krishnagopal S, Davis L (2019) Bidirectional convolutional lstm for the detection of violence in videos. In: Proceedings of the European Conference on Computer Vision (ECCV) Workshops.\u00a0Springer, Cham, pp 280\u2013295. https:\/\/doi.org\/10.1007\/978-3-030-11012-3_24","DOI":"10.1007\/978-3-030-11012-3_24"},{"key":"15774_CR29","doi-asserted-by":"publisher","unstructured":"Hassner T, Itcher Y, Kliper-Gross O (2012) Violent flows: Real-time detection of violent crowd behavior. In: 2012 IEEE computer society conference on computer vision and pattern recognition workshops. IEEE, pp 1\u20136. https:\/\/doi.org\/10.1109\/CVPRW.2012.6239348","DOI":"10.1109\/CVPRW.2012.6239348"},{"key":"15774_CR30","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter S, Schmidhuber J (1997) Long short-term memory. Neural Comput 9:1735\u20131780. https:\/\/doi.org\/10.1162\/neco.1997.9.8.1735","journal-title":"Neural Comput"},{"key":"15774_CR31","doi-asserted-by":"publisher","unstructured":"Hou C, Wu X, Wang G (2018) End-to-end bloody video recognition by audio-visual feature fusion. In: Chinese conference on pattern recognition and computer vision (PRCV). Springer, pp 501\u2013510. https:\/\/doi.org\/10.1007\/978-3-030-03398-9_43","DOI":"10.1007\/978-3-030-03398-9_43"},{"key":"15774_CR32","doi-asserted-by":"publisher","unstructured":"Ishikawa A, Bollis E, Avila S (2019) Combating the elsagate phenomenon: deep learning architectures for disturbing cartoons. In: 2019 7th international workshop on biometrics and forensics (IWBF). IEEE, pp 1\u20136. https:\/\/doi.org\/10.1109\/iwbf.2019.8739202","DOI":"10.1109\/iwbf.2019.8739202"},{"key":"15774_CR33","doi-asserted-by":"publisher","unstructured":"Jansohn C, Ulges A, Breuel TM (2009) Detecting pornographic video content by combining image features with motion information. In: Proceedings of the 17th ACM international conference on multimedia. ACM,\u00a0New York, NY, pp 601\u2013604. https:\/\/doi.org\/10.1145\/1631272.1631366","DOI":"10.1145\/1631272.1631366"},{"key":"15774_CR34","doi-asserted-by":"publisher","first-page":"81","DOI":"10.1109\/cvpr.1999.786951","volume":"46","author":"MJ Jones","year":"2002","unstructured":"Jones MJ, Rehg JM (2002) Statistical color models with application to skin detection. Int J Comput Vis 46:81\u201396. https:\/\/doi.org\/10.1109\/cvpr.1999.786951","journal-title":"Int J Comput Vis"},{"key":"15774_CR35","doi-asserted-by":"publisher","first-page":"696","DOI":"10.1109\/tce.2014.7027345","volume":"60","author":"S Jung","year":"2014","unstructured":"Jung S, Youn J, Sull S (2014) A real-time system for detecting indecent videos based on spatiotemporal patterns. IEEE Trans Consum Electron 60:696\u2013701. https:\/\/doi.org\/10.1109\/tce.2014.7027345","journal-title":"IEEE Trans Consum Electron"},{"key":"15774_CR36","doi-asserted-by":"publisher","unstructured":"Karpathy A, Toderici G, Shetty S, Leung T, Sukthankar R, Fei-Fei L (2014) Large-scale video classification with convolutional neural networks. In: Proceedings of the IEEE conference on Computer Vision and Pattern Recognition. IEEE,\u00a0Columbus, OH, pp 1725\u20131732. https:\/\/doi.org\/10.1109\/cvpr.2014.223","DOI":"10.1109\/cvpr.2014.223"},{"key":"15774_CR37","doi-asserted-by":"publisher","unstructured":"Kaushal R, Saha S, Bajaj P, Kumaraguru P (2016) KidsTube: detection, characterization and analysis of child unsafe content & promoters on YouTube. In: 2016 14th annual conference on privacy, Security and Trust (PST). IEEE, pp 157\u2013164. https:\/\/doi.org\/10.1109\/pst.2016.7906950","DOI":"10.1109\/pst.2016.7906950"},{"key":"15774_CR38","doi-asserted-by":"publisher","unstructured":"Kay W, Carreira J, Simonyan K, Zhang B, Hillier C, Vijayanarasimhan S, Viola F, Green T, Back T, Natsev P (2017) The kinetics human action video dataset. arXiv preprint arXiv:1705.06950. https:\/\/doi.org\/10.48550\/arXiv.1705.06950","DOI":"10.48550\/arXiv.1705.06950"},{"key":"15774_CR39","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/3065386","volume":"60","author":"A Krizhevsky","year":"2017","unstructured":"Krizhevsky A, Sutskever I, Hinton GE (2017) ImageNet classification with deep convolutional neural networks. Commun ACM 60:84\u201390. https:\/\/doi.org\/10.1145\/3065386","journal-title":"Commun ACM"},{"key":"15774_CR40","doi-asserted-by":"publisher","unstructured":"Kuehne H, Jhuang H, Garrote E, Poggio T, Serre T (2011) HMDB: a large video database for human motion recognition. In: 2011 international conference on computer vision. IEEE, pp 2556\u20132563. https:\/\/doi.org\/10.1007\/978-3-642-33374-3_41","DOI":"10.1007\/978-3-642-33374-3_41"},{"key":"15774_CR41","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1007\/s11263-005-1838-7","volume":"64","author":"I Laptev","year":"2005","unstructured":"Laptev I (2005) On space-time interest points. Int J Comput Vis 64:107\u2013123. https:\/\/doi.org\/10.1007\/s11263-005-1838-7","journal-title":"Int J Comput Vis"},{"key":"15774_CR42","doi-asserted-by":"publisher","first-page":"677","DOI":"10.1109\/tce.2009.5174439","volume":"55","author":"S Lee","year":"2009","unstructured":"Lee S, Shim W, Kim S (2009) Hierarchical system for objectionable video detection. IEEE Trans Consum Electron 55:677\u2013684. https:\/\/doi.org\/10.1109\/tce.2009.5174439","journal-title":"IEEE Trans Consum Electron"},{"key":"15774_CR43","doi-asserted-by":"publisher","first-page":"301022","DOI":"10.1016\/j.fsidi.2020.301022","volume":"34","author":"H-E Lee","year":"2020","unstructured":"Lee H-E, Ermakova T, Ververis V, Fabian B (2020) Detecting child sexual abuse material: a comprehensive survey. Forensic Sci Int Digit Invest 34:301022. https:\/\/doi.org\/10.1016\/j.fsidi.2020.301022","journal-title":"Forensic Sci Int Digit Invest"},{"key":"15774_CR44","doi-asserted-by":"publisher","unstructured":"Liu Y, Wang X, Zhang Y, Tang S (2011) Fusing audio-words with visual features for pornographic video detection. In: 2011 IEEE 10th international conference on trust, security and privacy in computing and communications. IEEE, pp 1488-1493. https:\/\/doi.org\/10.1109\/trustcom.2011.205","DOI":"10.1109\/trustcom.2011.205"},{"key":"15774_CR45","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1016\/j.future.2012.08.012","volume":"31","author":"Y Liu","year":"2014","unstructured":"Liu Y, Yang Y, Xie H, Tang S (2014) Fusing audio vocabulary with visual features for pornographic video detection. Futur Gener Comput Syst 31:69\u201376. https:\/\/doi.org\/10.1016\/j.future.2012.08.012","journal-title":"Futur Gener Comput Syst"},{"key":"15774_CR46","unstructured":"Livingstone S, Haddon L, G\u00f6rzig A, \u00d3lafsson K (2011) Risks and safety on the internet: the perspective of European children: full findings and policy implications from the EU kids online survey of 9-16 year olds and their parents in 25 countries. In, EU kids online network, London, UK. Available at: http:\/\/eprints.lse.ac.uk\/id\/eprint\/33731"},{"key":"15774_CR47","doi-asserted-by":"publisher","unstructured":"Lopes APB, de Avila SE, Peixoto AN, Oliveira RS, Coelho MDM, and Ara\u00fajo ADA (2009) Nude detection in video using bag-of-visual-features. In: 2009 XXII Brazilian Symposium on Computer Graphics and Image Processing. IEEE, pp 224\u2013231. https:\/\/doi.org\/10.1109\/sibgrapi.2009.32","DOI":"10.1109\/sibgrapi.2009.32"},{"key":"15774_CR48","unstructured":"Maheshwari S (2017) On YouTube Kids, startling videos slip past filters. The New York Times. https:\/\/www.nytimes.com\/2017\/11\/04\/business\/media\/youtube-kids-paw-patrol.html. Accessed 23 Nov 2021"},{"key":"15774_CR49","doi-asserted-by":"publisher","unstructured":"Mariconti E, Suarez-Tangil G, Blackburn J, De Cristofaro E, Kourtellis N, Leontiadis I, Serrano JL, Stringhini G (2019) \u201cYou know what to do\u201d proactive detection of YouTube videos targeted by coordinated hate attacks. Proceedings of the ACM on Human-Computer Interaction 3:1\u201321. https:\/\/doi.org\/10.1145\/3359309","DOI":"10.1145\/3359309"},{"key":"15774_CR50","doi-asserted-by":"publisher","unstructured":"Mohaouchane H, Mourhir A, Nikolov NS (2019) Detecting offensive language on arabic social media using deep learning. In: 2019 sixth international conference on social networks analysis, Management and Security (SNAMS). IEEE, pp. 466\u2013471. https:\/\/doi.org\/10.1109\/snams.2019.8931839","DOI":"10.1109\/snams.2019.8931839"},{"key":"15774_CR51","doi-asserted-by":"publisher","first-page":"46","DOI":"10.1016\/j.forsciint.2016.09.010","volume":"268","author":"D Moreira","year":"2016","unstructured":"Moreira D, Avila S, Perez M, Moraes D, Testoni V, Valle E, Goldenstein S, Rocha A (2016) Pornography classification: the hidden clues in video space\u2013time. Forensic Sci Int 268:46\u201361. https:\/\/doi.org\/10.1016\/j.forsciint.2016.09.010","journal-title":"Forensic Sci Int"},{"key":"15774_CR52","doi-asserted-by":"publisher","unstructured":"Moustafa M (2015) Applying deep learning to classify pornographic images and videos. arXiv preprint arXiv:1511.08899. https:\/\/doi.org\/10.48550\/arXiv.1511.08899","DOI":"10.48550\/arXiv.1511.08899"},{"key":"15774_CR53","doi-asserted-by":"publisher","first-page":"4459","DOI":"10.1007\/s10639-020-10183-7","volume":"25","author":"MM Neumann","year":"2020","unstructured":"Neumann MM, Herodotou C (2020) Evaluating YouTube videos for young children. Educ Inf Technol 25:4459\u20134475. https:\/\/doi.org\/10.1007\/s10639-020-10183-7","journal-title":"Educ Inf Technol"},{"key":"15774_CR54","doi-asserted-by":"publisher","first-page":"72","DOI":"10.1007\/s10639-020-10183-7","volume":"96","author":"MM Neumann","year":"2020","unstructured":"Neumann MM, Herodotou C (2020) Young children and YouTube: a global phenomenon. Child Educ 96:72\u201377. https:\/\/doi.org\/10.1007\/s10639-020-10183-7","journal-title":"Child Educ"},{"key":"15774_CR55","doi-asserted-by":"publisher","unstructured":"Nievas EB, Suarez OD, Garc\u00eda GB, Sukthankar R (2011) Violence detection in video using computer vision techniques. In: International conference on Computer analysis of images and patterns. Springer,\u00a0Berlin, Heidelberg, pp 332\u2013339. https:\/\/doi.org\/10.1007\/978-3-642-23678-5_39","DOI":"10.1007\/978-3-642-23678-5_39"},{"key":"15774_CR56","doi-asserted-by":"publisher","unstructured":"Ochoa VMT, Yayilgan SY, Cheikh FA (2012) Adult video content detection using machine learning techniques. In: 2012 eighth international conference on signal image technology and internet based systems. IEEE, pp 967-974. https:\/\/doi.org\/10.1109\/sitis.2012.143","DOI":"10.1109\/sitis.2012.143"},{"key":"15774_CR57","doi-asserted-by":"crossref","unstructured":"Papadamou K, Papasavva A, Zannettou S, Blackburn J, Kourtellis N, Leontiadis I, Stringhini G, Sirivianos M (2020) Disturbed YouTube for kids: characterizing and detecting inappropriate videos targeting young children. In: Proceedings of the international AAAI conference on web and social media. pp. 522\u2013533. Available at: https:\/\/ojs.aaai.org\/index.php\/ICWSM\/article\/view\/7320\/7174","DOI":"10.1609\/icwsm.v14i1.7320"},{"key":"15774_CR58","doi-asserted-by":"publisher","unstructured":"Peixoto BM, Avila S, Dias Z, and Rocha A (2018) Breaking down violence: a deep-learning strategy to model and classify violence in videos. In: Proceedings of the 13th International Conference on Availability, Reliability and Security (ARES 2018). ACM,\u00a0New York, NY, pp 1\u20137. https:\/\/doi.org\/10.1145\/3230833.3232809","DOI":"10.1145\/3230833.3232809"},{"key":"15774_CR59","doi-asserted-by":"publisher","first-page":"279","DOI":"10.1016\/j.neucom.2016.12.017","volume":"230","author":"M Perez","year":"2017","unstructured":"Perez M, Avila S, Moreira D, Moraes D, Testoni V, Valle E, Goldenstein S, Rocha A (2017) Video pornography detection through deep learning techniques and motion information. Neurocomputing 230:279\u2013293. https:\/\/doi.org\/10.1016\/j.neucom.2016.12.017","journal-title":"Neurocomputing"},{"key":"15774_CR60","doi-asserted-by":"publisher","unstructured":"Rea N, Lacey G, Dahyot R, Lambe C (2006) Multimodal periodicity analysis for illicit content detection in videos https:\/\/doi.org\/10.1049\/cp:20061978","DOI":"10.1049\/cp:20061978"},{"key":"15774_CR61","unstructured":"Reddit (2017) What is ElsaGate? https:\/\/www.reddit.com\/r\/ElsaGate\/comments\/6o6baf\/. Accessed 10 Sep 2021"},{"key":"15774_CR62","doi-asserted-by":"publisher","unstructured":"Simonyan K, Zisserman A (2014) Two-stream convolutional networks for action recognition in videos. In: NIPS'14: procs of the 27th Intl Conf. on neural information processing systems. MIT Press,\u00a0Cambridge, MA, pp 568\u2013576. https:\/\/doi.org\/10.5555\/2968826.2968890","DOI":"10.5555\/2968826.2968890"},{"key":"15774_CR63","doi-asserted-by":"publisher","unstructured":"Simonyan K, Zisserman A (2014) Very deep convolutional networks for large-scale image recognition. arXiv preprint arXiv:1409.1556. https:\/\/doi.org\/10.48550\/arXiv.1409.1556","DOI":"10.48550\/arXiv.1409.1556"},{"key":"15774_CR64","doi-asserted-by":"publisher","unstructured":"Singh S, Kaushal R, Buduru AB, Kumaraguru P (2019) KidsGUARD: fine grained approach for child unsafe video representation and detection. In: Proceedings of the 34th ACM\/SIGAPP symposium on applied computing. ACM,\u00a0New York, NY, pp 2104\u20132111. https:\/\/doi.org\/10.1145\/3297280.3297487","DOI":"10.1145\/3297280.3297487"},{"key":"15774_CR65","doi-asserted-by":"publisher","first-page":"102","DOI":"10.1016\/j.intmar.2012.01.002","volume":"26","author":"AN Smith","year":"2012","unstructured":"Smith AN, Fischer E, Yongjian C (2012) How does brand-related user-generated content differ across YouTube, Facebook, and twitter? J Interact Mark 26:102\u2013113. https:\/\/doi.org\/10.1016\/j.intmar.2012.01.002","journal-title":"J Interact Mark"},{"key":"15774_CR66","doi-asserted-by":"publisher","unstructured":"Soomro K, Zamir AR, Shah M (2012) UCF101: a dataset of 101 human actions classes from videos in the wild. arXiv preprint arXiv:1212.0402. https:\/\/doi.org\/10.48550\/arXiv.1212.0402","DOI":"10.48550\/arXiv.1212.0402"},{"key":"15774_CR67","doi-asserted-by":"publisher","first-page":"613","DOI":"10.1109\/ccdc.2019.8832598","volume":"1","author":"SA Sumon","year":"2019","unstructured":"Sumon SA, Shahria T, Goni R, Hasan N, Almarufuzzaman A, Rahman RM (2019) Violent crowd flow detection using deep learning. In: ACIIDS 1:613\u2013625. https:\/\/doi.org\/10.1109\/ccdc.2019.8832598","journal-title":"In: ACIIDS"},{"key":"15774_CR68","doi-asserted-by":"publisher","unstructured":"Sutskever I, Vinyals O, Le QV (2014) Sequence to sequence learning with neural networks. In: Advances in neural information processing systems (NIPS'14). MIT Press,\u00a0Cambridge, MA, pp 3104\u20133112. https:\/\/doi.org\/10.5555\/2969033.2969173","DOI":"10.5555\/2969033.2969173"},{"key":"15774_CR69","doi-asserted-by":"publisher","unstructured":"Szegedy C, Vanhoucke V, Ioffe S, Shlens J, Wojna Z (2016) Rethinking the inception architecture for computer vision. In: Proceedings of the IEEE conference on computer vision and pattern recognition. IEEE,\u00a0Las Vegas, NV, pp 2818\u20132826. https:\/\/doi.org\/10.1109\/cvpr.2016.308","DOI":"10.1109\/cvpr.2016.308"},{"key":"15774_CR70","doi-asserted-by":"publisher","unstructured":"Tahir R, Ahmed F, Saeed H, Ali S, Zaffar F, Wilson C (2019) Bringing the kid back into youtube kids: detecting inappropriate content on video streaming platforms. In: 2019 IEEE\/ACM international conference on advances in social networks analysis and mining (ASONAM). IEEE,\u00a0Vancouver, BC, pp 464\u2013469. https:\/\/doi.org\/10.1145\/3341161.3342913","DOI":"10.1145\/3341161.3342913"},{"key":"15774_CR71","doi-asserted-by":"publisher","unstructured":"Tan M, Le Q (2019) Efficientnet: rethinking model scaling for convolutional neural networks. In: international conference on machine learning. PMLR, pp 6105-6114. https:\/\/doi.org\/10.48550\/arXiv.1905.11946","DOI":"10.48550\/arXiv.1905.11946"},{"key":"15774_CR72","doi-asserted-by":"publisher","unstructured":"Tang S, Li J, Zhang Y, Xie C, Li M, Liu Y, Hua X, Zheng Y-T, Tang J, Chua T-S (2009) Pornprobe: an lda-svm based pornography detection system. In: proceedings of the 17th ACM international conference on multimedia. Pp 1003-1004. https:\/\/doi.org\/10.1145\/1631272.1631490","DOI":"10.1145\/1631272.1631490"},{"key":"15774_CR73","doi-asserted-by":"publisher","unstructured":"Trana RE, Gomez CE, Adler RF (2020) Fighting cyberbullying: an analysis of algorithms used to detect harassing text found on YouTube. In: International conference on applied human factors and ergonomics. Springer, pp. 9\u201315. https:\/\/doi.org\/10.1007\/978-3-030-51328-3_2","DOI":"10.1007\/978-3-030-51328-3_2"},{"key":"15774_CR74","doi-asserted-by":"publisher","unstructured":"Ulges A, Schulze C, Borth D, Stahl A (2012) Pornography detection in video benefits (a lot) from a multi-modal approach. In: Proceedings of the 2012 ACM international workshop on audio and multimedia methods for large-scale video analysis (AMVA '12). ACM,\u00a0New York, NY, pp 21\u201326. https:\/\/doi.org\/10.1145\/2390214.2390222","DOI":"10.1145\/2390214.2390222"},{"key":"15774_CR75","doi-asserted-by":"publisher","first-page":"303","DOI":"10.1016\/j.jvcir.2017.12.005","volume":"50","author":"P Vitorino","year":"2018","unstructured":"Vitorino P, Avila S, Perez M, Rocha A (2018) Leveraging deep neural networks to fight child pornography in the age of social media. J Vis Commun Image Represent 50:303\u2013313. https:\/\/doi.org\/10.1016\/j.jvcir.2017.12.005","journal-title":"J Vis Commun Image Represent"},{"key":"15774_CR76","doi-asserted-by":"publisher","first-page":"60","DOI":"10.1007\/s11263-012-0594-8","volume":"103","author":"H Wang","year":"2013","unstructured":"Wang H, Kl\u00e4ser A, Schmid C, Liu C-L (2013) Dense trajectories and motion boundary descriptors for action recognition. Int J Comput Vis 103:60\u201379. https:\/\/doi.org\/10.1007\/s11263-012-0594-8","journal-title":"Int J Comput Vis"},{"key":"15774_CR77","doi-asserted-by":"publisher","first-page":"432","DOI":"10.1016\/j.neucom.2017.07.012","volume":"272","author":"J Wehrmann","year":"2018","unstructured":"Wehrmann J, Sim\u00f5es GS, Barros RC, Cavalcante VF (2018) Adult content detection in videos with convolutional and recurrent neural networks. Neurocomputing 272:432\u2013438. https:\/\/doi.org\/10.1016\/j.neucom.2017.07.012","journal-title":"Neurocomputing"},{"key":"15774_CR78","unstructured":"Wikipedia (2019) TV Parental Guidelines. https:\/\/en.wikipedia.org\/wiki\/TV_Parental_Guidelines. Accessed 1 Aug 2019"},{"key":"15774_CR79","first-page":"8","volume":"10","author":"H Wilson","year":"2020","unstructured":"Wilson H (2020) Youtube is unsafe for children: Youtube's safeguards and the current legal framework are inadequate to protect children from disturbing content. Seattle J Technol Environ Innov Law 10:8 Available at: https:\/\/digitalcommons.law.seattleu.edu\/sjteil\/vol10\/iss1\/8","journal-title":"Seattle J Technol Environ Innov Law"},{"key":"15774_CR80","doi-asserted-by":"publisher","unstructured":"Wolf L, Hassner T, Maoz I (2011) Face recognition in unconstrained videos with matched background similarity. In: CVPR 2011. IEEE, pp 529-534. https:\/\/doi.org\/10.1109\/cvpr.2011.5995566","DOI":"10.1109\/cvpr.2011.5995566"},{"key":"15774_CR81","doi-asserted-by":"publisher","unstructured":"Wu Z, Wang X, Jiang Y-G, Ye H, Xue X (2015) Modeling spatial-temporal clues in a hybrid deep learning framework for video classification. In: proceedings of the 23rd ACM international conference on multimedia. ACM, pp 461-470. https:\/\/doi.org\/10.1145\/2733373.2806222","DOI":"10.1145\/2733373.2806222"},{"key":"15774_CR82","doi-asserted-by":"publisher","unstructured":"Wu Z, Jiang Y-G, Wang X, Ye H, Xue X, Wang J (2015) Fusing multi-stream deep networks for video classification. arXiv preprint arXiv:1509.06086. https:\/\/doi.org\/10.48550\/arXiv.1509.06086","DOI":"10.48550\/arXiv.1509.06086"},{"key":"15774_CR83","doi-asserted-by":"publisher","unstructured":"Ye H, Wu Z, Zhao R-W, Wang X, Jiang Y-G, Xue X (2015) Evaluating two-stream CNN for video classification. In: Proceedings of the 5th ACM on International Conference on Multimedia Retrieval (ICMR '15). ACM,\u00a0New York, NY, pp 435\u2013442. https:\/\/doi.org\/10.1145\/2671188.2749406","DOI":"10.1145\/2671188.2749406"},{"key":"15774_CR84","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1007\/s41060-017-0088-4","volume":"6","author":"H Yenala","year":"2018","unstructured":"Yenala H, Jhanwar A, Chinnakotla MK, Goyal J (2018) Deep learning for detecting inappropriate content in text. Int J Data Sci Anal 6:273\u2013286. https:\/\/doi.org\/10.1007\/s41060-017-0088-4","journal-title":"Int J Data Sci Anal"},{"key":"15774_CR85","doi-asserted-by":"publisher","first-page":"16283","DOI":"10.1109\/ACCESS.2022.3147519","volume":"10","author":"K Yousaf","year":"2022","unstructured":"Yousaf K, Nawaz T (2022) A deep learning-based approach for inappropriate content detection and classification of YouTube videos. IEEE Access 10:16283\u201316298. https:\/\/doi.org\/10.1109\/ACCESS.2022.3147519","journal-title":"IEEE Access"},{"key":"15774_CR86","doi-asserted-by":"publisher","unstructured":"Yue-Hei Ng J, Hausknecht M, Vijayanarasimhan S, Vinyals O, Monga R, Toderici G (2015) Beyond short snippets: deep networks for video classification. In: Proceedings of the IEEE conference on computer vision and pattern recognition. IEEE, pp 4694\u20134702. https:\/\/doi.org\/10.1109\/cvpr.2015.7299101","DOI":"10.1109\/cvpr.2015.7299101"},{"key":"15774_CR87","doi-asserted-by":"publisher","unstructured":"Zach C, Pock T, and Bischof H (2007) A duality based approach for realtime TV-L 1 Optical Flow. In: Joint pattern recognition symposium. Springer,\u00a0Berlin, Heidelberg, pp 214\u2013223. https:\/\/doi.org\/10.1007\/978-3-540-74936-3_22","DOI":"10.1007\/978-3-540-74936-3_22"},{"key":"15774_CR88","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13640-020-00501-x","volume":"2020","author":"Y Zhao","year":"2020","unstructured":"Zhao Y, Man KL, Smith J, Siddique K, Guan S-U (2020) Improved two-stream model for human action recognition. EURASIP J Image Vid Process 2020:1\u20139. https:\/\/doi.org\/10.1186\/s13640-020-00501-x","journal-title":"EURASIP J Image Vid Process"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-15774-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-023-15774-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-023-15774-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,4,2]],"date-time":"2024-04-02T13:09:57Z","timestamp":1712063397000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-023-15774-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,5,17]]},"references-count":88,"journal-issue":{"issue":"12","published-online":{"date-parts":[[2024,4]]}},"alternative-id":["15774"],"URL":"https:\/\/doi.org\/10.1007\/s11042-023-15774-3","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,5,17]]},"assertion":[{"value":"21 May 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 March 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 May 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 May 2023","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 December 2023","order":5,"name":"change_date","label":"Change Date","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Update","order":6,"name":"change_type","label":"Change Type","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Note: Minor corrections in equations 1 to 5 due to tilde placement.","order":7,"name":"change_details","label":"Change Details","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"This article does not contain any studies with human participants or animals performed by any of the\nauthors.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Research involving human participants and\/or animals"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Informed consent"}},{"value":"Not applicable.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":5,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}