{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,1]],"date-time":"2025-11-01T09:36:32Z","timestamp":1761989792353,"version":"3.38.0"},"reference-count":59,"publisher":"Tech Science Press","issue":"2","license":[{"start":{"date-parts":[[2024,11,24]],"date-time":"2024-11-24T00:00:00Z","timestamp":1732406400000},"content-version":"vor","delay-in-days":328,"URL":"https:\/\/doi.org\/10.32604\/TSP-CROSSMARKPOLICY"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["CMC"],"published-print":{"date-parts":[[2024]]},"DOI":"10.32604\/cmc.2024.055787","type":"journal-article","created":{"date-parts":[[2024,10,16]],"date-time":"2024-10-16T06:41:46Z","timestamp":1729060906000},"page":"2493-2515","update-policy":"https:\/\/doi.org\/10.32604\/tsp-crossmarkpolicy","source":"Crossref","is-referenced-by-count":2,"title":["A Recurrent Neural Network for Multimodal Anomaly Detection by Using Spatio-Temporal Audio-Visual Data"],"prefix":"10.32604","volume":"81","author":[{"given":"Sameema","family":"Tariq","sequence":"first","affiliation":[]},{"given":"Ata-Ur-","family":"Rehman","sequence":"additional","affiliation":[]},{"given":"Maria","family":"Abubakar","sequence":"additional","affiliation":[]},{"given":"Waseem","family":"Iqbal","sequence":"additional","affiliation":[]},{"given":"Hatoon S.","family":"Alsagri","sequence":"additional","affiliation":[]},{"given":"Yousef A.","family":"Alduraywish","sequence":"additional","affiliation":[]},{"given":"Haya Abdullah A.","family":"Alhakbani","sequence":"additional","affiliation":[]}],"member":"17807","published-online":{"date-parts":[[2024]]},"reference":[{"key":"ref1","doi-asserted-by":"crossref","unstructured":"H. Lin, J. D. Deng, B. J. Woodford, and A. Shahi, \u201cOnline weighted clustering for real-time abnormal event detection in video surveillance,\u201d presented at the ACM Int. Conf. Multimed., Amsterdam, Netherlands, Oct. 2016, pp. 536\u2013540.","DOI":"10.1145\/2964284.2967279"},{"key":"ref2","doi-asserted-by":"crossref","first-page":"443","DOI":"10.1016\/j.patcog.2015.09.005","article-title":"Combining motion and appearance cues for anomaly detection","volume":"51","author":"Zhang","year":"Jan. 2016","journal-title":"Pattern Recognit."},{"journal-title":"Automated Audio-Visual Activity Analysis","year":"2005","author":"Stauffer","key":"ref3"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"298","DOI":"10.1016\/j.procs.2021.08.031","article-title":"Using deep autoencoders for in-vehicle audio anomaly detection","volume":"192","author":"Pereira","year":"Jan. 2021","journal-title":"Procedia Comput. Sci."},{"key":"ref5","doi-asserted-by":"crossref","unstructured":"M. Pooyan, X. Zhang, M. Hamidi, and J. Zhang, \u201cDeep learning-based anomaly detection for compressors using audio data,\u201d presented at the Annu. Reliabil. Maintainability Symp. (RAMS), Orlando, FL, USA, Jan. 2021, pp. 1\u20137.","DOI":"10.1109\/RAMS48097.2021.9605720"},{"key":"ref6","series-title":"Proc. IEEE Int. Conf. Acoust., Speech, Signal Process. (ICASSP)","first-page":"1996","article-title":"A novel approach for automatic acoustic novelty detection using a denoising autoencoder with bidirectional LSTM neural networks","author":"Marchi","year":"Apr. 2015"},{"key":"ref7","unstructured":"Towards Data Science, \u201cDenoising Autoencoders (DAE): How to use neural networks to cleanup your data,\u201d Towards Data Science. Accessed: May 20, 2022. [Online]. Available: https:\/\/towardsdatascience.com\/denoising-autoencoders-dae-how-to-use-neural-networks-to-cleanup-your-data-cd9c19bc6915"},{"key":"ref8","unstructured":"Towards Data Science, \u201cSparse autoencoder neural networks: How to utilize sparsity for robust information encoding,\u201d Towards Data Science. Accessed: May 20, 2022. [Online]. Available: https:\/\/towardsdatascience.com\/sparse-autoencoder-neural-networks-how-to-utilise-sparsity-for-robust-information-encoding-6aa9ff542bc9"},{"key":"ref9","unstructured":"Keras, \u201cBuilding Autoencoders in Keras,\u201d Keras. Accessed: May 20, 2022. [Online]. Available: https:\/\/blog.keras.io\/building-autoencoders-in-keras.html"},{"key":"ref10","unstructured":"Keras, \u201cVariational Autoencoders (VAE),\u201d Keras. Accessed: May 20, 2022. [Online]. Available: https:\/\/keras.io\/examples\/generative\/vae\/"},{"key":"ref11","doi-asserted-by":"crossref","unstructured":"P. Kumari and M. Saini, \u201cAnomaly detection in audio with concept drift using adaptive Huffman coding,\u201d 2021, arXiv:2102.10515.","DOI":"10.1109\/JSEN.2022.3193969"},{"key":"ref12","doi-asserted-by":"crossref","first-page":"229","DOI":"10.1016\/j.icte.2020.06.003","article-title":"Unsupervised log message anomaly detection","volume":"6","author":"Amir","year":"Sep. 2020","journal-title":"ICT Express"},{"key":"ref13","doi-asserted-by":"crossref","first-page":"41","DOI":"10.1016\/j.engappai.2019.05.011","article-title":"IRESE: An intelligent rare-event detection system using unsupervised learning on the IoT edge","volume":"84","author":"Janjua","year":"Jan. 2019","journal-title":"Eng Appl. Artif. Intell."},{"key":"ref14","doi-asserted-by":"crossref","first-page":"5537","DOI":"10.1007\/s11042-021-11817-9","article-title":"Anomalous sound event detection: A survey of machine learning based methods and applications","volume":"81","author":"Mnasri","year":"Feb. 2022","journal-title":"Multimed. Tools Appl."},{"key":"ref15","unstructured":"Y. Koizumi et al., \u201cDescription and discussion on DCASE2020 challenge task2: Unsupervised anomalous sound detection for machine condition monitoring,\u201d 2020, arXiv:2006.05822."},{"key":"ref16","doi-asserted-by":"crossref","unstructured":"G. Pang, Y. Cheng, C. Shen, A. Van den Hengel, and X. Bai, \u201cSelf-trained deep ordinal regression for end-to-end video anomaly detection,\u201d presented at the IEEE\/CVF Conf. Comput. Vis. Pattern Recognit. (CVPR), Seattle, WA, USA, Jun. 2020, pp. 12173\u201312182.","DOI":"10.1109\/CVPR42600.2020.01219"},{"key":"ref17","doi-asserted-by":"crossref","first-page":"36188","DOI":"10.1109\/ACCESS.2022.3164439","article-title":"An adaptive framework for anomaly detection in time-series audio-visual data","volume":"10","author":"Kumari","year":"Jan. 2022","journal-title":"IEEE Access"},{"key":"ref18","doi-asserted-by":"crossref","unstructured":"R. Morais, V. Le, T. Tran, B. Saha, M. Mansour and S. Venkatesh, \u201cLearning regularity in skeleton trajectories for anomaly detection in videos,\u201d presented at the IEEE Conf. Comput. Vis. Pattern Recognit. (CVPR), Long Beach, CA, USA, Jun. 2019, pp. 11996\u201312004.","DOI":"10.1109\/CVPR.2019.01227"},{"key":"ref19","doi-asserted-by":"crossref","unstructured":"H. -S. Fang, S. Xie, Y. -W. Tai, and C. Lu, \u201cRMPE: Regional multiperson pose estimation,\u201d presented at the IEEE Int. Conf. Comput. Vis. (ICCV), Venice, Italy, Oct. 2017, pp. 2334\u20132343.","DOI":"10.1109\/ICCV.2017.256"},{"key":"ref20","series-title":"Proc. Conf. Empir. Methods in Nat. Lang. Process. (EMNLP)","first-page":"1724","article-title":"Learning phrase representations using RNN encoder-decoder for statistical machine translation","author":"Cho","year":"2014"},{"key":"ref21","first-page":"2293","article-title":"A survey of single-scene video anomaly detection","volume":"44","author":"Ramachandra","year":"May 2020","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"ref22","first-page":"246","article-title":"Sparse coding guided spatiotemporal feature learning for abnormal event detection in large videos","volume":"20","author":"Chu","year":"Jan. 2018","journal-title":"IEEE Trans. Multimed."},{"key":"ref23","doi-asserted-by":"crossref","unstructured":"Y. Cong, J. Yuan, and J. Liu, \u201cSparse reconstruction cost for abnormal event detection,\u201d presented at the IEEE Conf.Comput. Vis. Pattern Recognit. (CVPR), Colorado Springs, CO, USA, Jun. 2011, pp. 3449\u20133456.","DOI":"10.1109\/CVPR.2011.5995434"},{"key":"ref24","doi-asserted-by":"crossref","unstructured":"C. Lu, J. Shi, and J. Jia, \u201cAbnormal event detection at 150 fps in MATLAB,\u201d presented at the IEEE Int. Conf. Comput. Vis. (ICCV), Sydney, Australia, Dec. 2013, pp. 2720\u20132727.","DOI":"10.1109\/ICCV.2013.338"},{"key":"ref25","unstructured":"Y. Lu, C. Cao, and Y. Zhang, \u201cLearnable locality-sensitive hashing for video anomaly detection,\u201d 2021, arXiv:2111.07839."},{"key":"ref26","doi-asserted-by":"crossref","first-page":"187","DOI":"10.1016\/j.patcog.2016.09.016","article-title":"Online growing neural gas for anomaly detection in changing surveillance scenes","volume":"61","author":"Sun","year":"Jan. 2017","journal-title":"Pattern Recognit."},{"key":"ref27","unstructured":"L. Naud and A. Lavin, \u201cManifolds for unsupervised visual anomaly detection,\u201d 2020, arXiv:2006.11364."},{"key":"ref28","doi-asserted-by":"crossref","unstructured":"P. Wu et al., \u201cNot only look, but also listen: Learning multimodal violence detection under weak supervision,\u201d presented at the Eur. Conf. Comput. Vis. (ECCV), Glasgow, UK, Aug. 2020, pp. 322\u2013339.","DOI":"10.1007\/978-3-030-58577-8_20"},{"key":"ref29","doi-asserted-by":"crossref","first-page":"30587","DOI":"10.1109\/ACCESS.2021.3059519","article-title":"Multi-modal anomaly detection by using audio and visual cues","volume":"9","author":"Rehman","year":"Jan. 2021","journal-title":"IEEE Access"},{"key":"ref30","doi-asserted-by":"crossref","first-page":"96","DOI":"10.1109\/MSP.2017.2738401","article-title":"Deep multimodal learning: A survey on recent advances and trends","volume":"34","author":"Ramachandram","year":"Nov. 2017","journal-title":"IEEE Signal Process. Mag."},{"key":"ref31","doi-asserted-by":"crossref","unstructured":"R. Gao, T. -H. Oh, K. Grauman, and L. Torresani, \u201cListen to look: Action recognition by previewing audio,\u201d presented at the IEEE\/CVF Conf. Comput. Vis. Pattern Recognit. (CVPR), Seattle, WA, USA, Jun. 2020, pp. 10457\u201310467.","DOI":"10.1109\/CVPR42600.2020.01047"},{"key":"ref32","doi-asserted-by":"crossref","unstructured":"A. R. Lejb\u00f8lle, B. Krogh, K. Nasrollahi, and T. B. Moeslund, \u201cAttention in multimodal neural networks for person re-identification,\u201d presented at the IEEE Conf. Comput. Vis. Pattern Recognit. Workshops, Salt Lake City, UT, USA, Jun. 2018, pp. 179\u2013187.","DOI":"10.1109\/CVPRW.2018.00055"},{"key":"ref33","article-title":"Deep multi-level fusion network for multi-source image pixel-wise classification","volume":"233","author":"Liu","year":"Jan. 2021, Art. no. 106921","journal-title":"Knowl.-Based Syst."},{"key":"ref34","first-page":"461","article-title":"Deep multiple instance learning-based spatial-spectral classification for PAN and MS imagery","volume":"55","author":"Liu","year":"Sep. 2017","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"key":"ref35","doi-asserted-by":"crossref","first-page":"345","DOI":"10.1007\/s00530-010-0182-0","article-title":"Multimodal fusion for multimedia analysis: A survey","volume":"16","author":"Atrey","year":"Jan. 2010","journal-title":"Multimed. Syst."},{"key":"ref36","unstructured":"K. M. Imran, S. N. Foley, and B. O\u2019Sullivan, \u201cDatabase Intrusion Detection Systems (DIDs): Insider threat detection via behavioural-based anomaly detection systems\u2014A brief survey of concepts and approaches,\u201d 2020, arXiv:2011.02308."},{"key":"ref37","doi-asserted-by":"crossref","first-page":"698","DOI":"10.1109\/LSP.2004.831663","article-title":"Generalization of spectral flatness measure for non-gaussian linear processes","volume":"11","author":"Dubnov","year":"Dec. 2004","journal-title":"IEEE Signal Process. Lett."},{"key":"ref38","doi-asserted-by":"crossref","DOI":"10.1016\/j.apacoust.2019.107020","article-title":"Trends in audio signal feature extraction methods","volume":"158","author":"Sharma","year":"Jan. 2020, Art. no. 107020","journal-title":"Appl. Acoust."},{"key":"ref39","unstructured":"Analytics India Magazine, \u201cA tutorial on spectral feature extraction for audio analytics,\u201d Analytics India Magazine. Accessed: Dec. 20, 2021. [Online]. Available: https:\/\/analyticsindiamag.com\/a-tutorial-on-spectral-feature-extraction-for-audio-analytics\/"},{"key":"ref40","unstructured":"Analytics India Magazine, \u201cHands-on guide to implement batch normalization in deep learning models,\u201d Accessed: Jun. 13, 2021. [Online]. Available: https:\/\/analyticsindiamag.com\/hands-on-guide-to-implement-batch-normalization-in-deep-learning-models\/"},{"key":"ref41","unstructured":"Analytics India Magazine, \u201cConvolutional layer,\u201d Accessed: Jun. 12, 2021. [Online]. Available: https:\/\/databricks.com\/glossary\/convolutional-layer"},{"key":"ref42","unstructured":"M. L. Value, \u201cTime distributed layer in Keras with example in Python,\u201d Accessed: Jun. 13, 2021. [Online]. Available: https:\/\/valueml.com\/time-distributed-layer-in-keras-with-example-in-python\/"},{"key":"ref43","doi-asserted-by":"crossref","unstructured":"M. Hasan, J. Choi, J. Neumann, A. K. Roy Chowdhury, and L. S. Davis, \u201cLearning temporal regularity in video sequences,\u201d presented at the IEEE Conf. Comput. Vis. Pattern Recognit. (CVPR), Las Vegas, NV, USA, Jun. 2016, pp. 733\u2013742.","DOI":"10.1109\/CVPR.2016.86"},{"key":"ref44","unstructured":"Towards Data Science, \u201cPrototyping an anomaly detection system for videos: Step-by-step using LSTM & convolutional,\u201d Towards Data Science. Accessed: Jun. 10, 2022. [Online]. Available: https:\/\/towardsdatascience.com\/prototyping-an-anomaly-detection-system-for-videos-step-by-step-using-lstm-convolutional-4e06b7dcdd29"},{"key":"ref45","unstructured":"Github, \u201cUCSD-UMN anomalous audio datasets,\u201d Accessed: Aug. 05, 2022. [Online]. Available: https:\/\/github.com\/tsameema\/UCSD-UMN-Anomalous_Audio-Datasets"},{"key":"ref46","unstructured":"DCASE, \u201cTask 1: Rare sound event detection,\u201d Accessed: Jul. 24, 2021. [Online]. Available: https:\/\/dcase.community\/challenge2017\/taskrare-sound-event-detection"},{"key":"ref47","series-title":"Proc. IEEE Comput. Soc. Conf. Comput. Vis. Pattern Recognit. (CVPR)","first-page":"1975","article-title":"Anomaly detection in crowded scenes","author":"Mahadevan","year":"2010"},{"key":"ref48","unstructured":"Machine Learning Mastery, \u201cHow to choose loss functions when training deep learning neural networks,\u201d Machine Learning Mastery. Accessed: Jan. 13, 2022. [Online]. Available: https:\/\/machinelearningmastery.com\/how-to-choose-loss-functions-when-training-deep-learningneural-networks\/"},{"key":"ref49","unstructured":"Analytics Vidhya, \u201cBinary cross-entropy (Log Loss) for binary classification,\u201d  Analytics Vidhya. Accessed: Jan. 13, 2022. [Online]. Available: https:\/\/www.analyticsvidhya.com\/blog\/2021\/03\/binary-cross-entropy-log-loss-for-binary-classification\/"},{"key":"ref50","unstructured":"Analytics Vidhya, \u201cA comprehensive guide on deep learning optimizers,\u201d Analytics Vidhya. Accessed: Jan. 20, 2022. [Online]. Available: https:\/\/www.analyticsvidhya.com\/blog\/2021\/10\/a-comprehensive-guide-on-deep-learning-optimizers\/"},{"key":"ref51","unstructured":"Towards Data Science, \u201cAdam: Latest trends in deep learning optimization,\u201d Towards Data Science. Accessed: Jan. 20, 2022. [Online]. Available: https:\/\/towardsdatascience.com\/adam-latest-trends-in-deep-learning-optimization-6be9a291375c"},{"key":"ref52","doi-asserted-by":"crossref","unstructured":"N. Rashmiranjan, U. C. Pati, and S. K. Das, \u201cVideo anomaly detection using convolutional spatiotemporal autoencoder,\u201d presented at the Int. Conf. Contemp. Comput. Appl. (IC3A), Patna, India, Feb. 2020, pp. 175\u2013180.","DOI":"10.1109\/IC3A48958.2020.233292"},{"key":"ref53","doi-asserted-by":"crossref","DOI":"10.1155\/2021\/7367870","article-title":"Anomaly detection in videos using two-stream autoencoder with post hoc interpretability","volume":"2021","author":"Feng","year":"2021, Art. no. 7367870","journal-title":"Comput. Intell. Neurosci."},{"key":"ref54","doi-asserted-by":"crossref","unstructured":"W. Tian, Z. Miao, Y. Chen, Y. Zhou, G. Shan and H. Snoussi, \u201cAED-Net: An abnormal event detection network,\u201d presented at the Eng. Conf., Nanjing, China, Sep. 2019, pp. 930\u2013939.","DOI":"10.1016\/j.eng.2019.02.008"},{"key":"ref55","article-title":"Towards zero shot learning of geometry of motion streams and its application to anomaly recognition","volume":"186","author":"Buckchash","year":"Sep. 2021, Art. no. 114916","journal-title":"Expert. Syst. Appl."},{"key":"ref56","doi-asserted-by":"crossref","first-page":"3463","DOI":"10.1109\/TIP.2017.2695105","article-title":"Video anomaly detection with compact feature sets for online performance","volume":"26","author":"Leyva","year":"Jul. 2017","journal-title":"IEEE Trans. Image Process"},{"key":"ref57","doi-asserted-by":"crossref","DOI":"10.1016\/j.eswa.2021.116394","article-title":"A novel framework for detection of motion and appearance-based anomaly using ensemble learning and LSTMs","volume":"192","author":"Sabih","year":"Jan. 2022","journal-title":"Expert Syst. Appl."},{"key":"ref58","unstructured":"M. R. Parate, K. M. Bhurchandi, and A. G. Kothari, \u201cAnomaly detection in residential video surveillance on edge devices in IoT framework,\u201d 2021, arXiv:2107.04767."},{"key":"ref59","unstructured":"Monitoring human activity, Accessed: Jul. 24, 2021. [Online]. Available: http:\/\/mha.cs.umn.edu\/proj_events.shtml"}],"container-title":["Computers, Materials &amp; Continua"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.techscience.com\/files\/cmc\/2024\/TSP_CMC-81-2\/TSP_CMC_55787\/TSP_CMC_55787.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,7]],"date-time":"2025-03-07T04:11:30Z","timestamp":1741320690000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.techscience.com\/cmc\/v81n2\/58645"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"references-count":59,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2024]]},"published-print":{"date-parts":[[2024]]}},"URL":"https:\/\/doi.org\/10.32604\/cmc.2024.055787","relation":{},"ISSN":["1546-2226"],"issn-type":[{"type":"electronic","value":"1546-2226"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"2024-07-07","order":0,"name":"received","label":"Received","group":{"name":"publication_history","label":"Publication History"}},{"value":"2024-09-19","order":1,"name":"accepted","label":"Accepted","group":{"name":"publication_history","label":"Publication History"}},{"value":"2024-11-18","order":2,"name":"published","label":"Published Online","group":{"name":"publication_history","label":"Publication History"}}]}}