{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,5,2]],"date-time":"2025-05-02T22:10:10Z","timestamp":1746223810889,"version":"3.40.4"},"publisher-location":"Cham","reference-count":50,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319056951"},{"type":"electronic","value":"9783319056968"}],"license":[{"start":{"date-parts":[[2014,1,1]],"date-time":"2014-01-01T00:00:00Z","timestamp":1388534400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2014,1,1]],"date-time":"2014-01-01T00:00:00Z","timestamp":1388534400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014]]},"DOI":"10.1007\/978-3-319-05696-8_7","type":"book-chapter","created":{"date-parts":[[2014,5,9]],"date-time":"2014-05-09T14:19:39Z","timestamp":1399645179000},"page":"161-184","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Multimodal Fusion in Surveillance Applications"],"prefix":"10.1007","author":[{"given":"Virginia","family":"Fernandez Arguedas","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qianni","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ebroul","family":"Izquierdo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2014,3,26]]},"reference":[{"key":"7_CR1","unstructured":"Aghajan H, Cavallaro A (2009) Multi-camera networks: principles and applications. Academic Press, London"},{"key":"7_CR2","doi-asserted-by":"crossref","unstructured":"Argillander J, Iyengar G, Nock H (2005) Semantic annotation of multimedia using maximum entropy models. In: IEEE international conference on acoustics, speech, and signal processing, vol 2. pp 153\u2013156","DOI":"10.1109\/ICASSP.2005.1415364"},{"key":"7_CR3","doi-asserted-by":"crossref","unstructured":"Arsic D, Schuller B, Rigoll G (2007) Suspicious behavior detection in public transport by fusion of low-level video descriptors. In: IEEE international conference on multimedia and expo, pp 2018\u20132021","DOI":"10.1109\/ICME.2007.4285076"},{"key":"7_CR4","doi-asserted-by":"publisher","first-page":"155","DOI":"10.1007\/978-3-540-69429-8_16","volume":"4352","author":"P Atrey","year":"2006","unstructured":"Atrey P, Kankanhalli M, El Saddik A (2006) Confidence building among correlated streams in multimedia surveillance systems. Adv Multimedia Model 4352:155\u2013164","journal-title":"Adv Multimedia Model"},{"issue":"6","key":"7_CR5","doi-asserted-by":"publisher","first-page":"345","DOI":"10.1007\/s00530-010-0182-0","volume":"16","author":"PK Atrey","year":"2010","unstructured":"Atrey PK, Hossain MA, El Saddik A, Kankanhalli MS (2010) Multimodal fusion for multimedia analysis: a survey. Multimedia Syst 16(6):345\u2013379","journal-title":"Multimedia Syst"},{"issue":"3","key":"7_CR6","doi-asserted-by":"publisher","first-page":"239","DOI":"10.1007\/s00530-006-0063-8","volume":"12","author":"PK Atrey","year":"2006","unstructured":"Atrey PK, Kankanhalli MS, Jain R (2006) Information assimilation framework for event detection in multimedia surveillance systems. Multimedia syst 12(3):239\u2013253","journal-title":"Multimedia syst"},{"key":"7_CR7","doi-asserted-by":"crossref","unstructured":"Bahlmann C, Pellkofer M, Giebel J, Baratoff G (2008) Multi-modal speed limit assistants: Combining camera and gps maps. In: IEEE intelligent vehicles symposium, pp 132\u2013137","DOI":"10.1109\/IVS.2008.4621215"},{"key":"7_CR8","doi-asserted-by":"crossref","unstructured":"Bahlmann C, Zhu Y, Ramesh V, Pellkofer M, Koehler T (2005) A system for traffic sign detection, tracking, and recognition using color, shape, and motion information. In: IEEE intelligent vehicles symposium, pp 255\u2013260","DOI":"10.1109\/IVS.2005.1505111"},{"key":"7_CR9","unstructured":"Brooks RR, Iyengar SS (1998) Multi-sensor fusion: fundamentals and applications with software. Prentice-Hall Inc, Upper Saddle River"},{"issue":"1\u20132","key":"7_CR10","doi-asserted-by":"publisher","first-page":"431","DOI":"10.1016\/0004-3702(95)00041-0","volume":"78","author":"H Buxton","year":"1995","unstructured":"Buxton H, Gong S (1995) Visual surveillance in a dynamic and uncertain world. Artif Intell 78(1\u20132):431\u2013459","journal-title":"Artif Intell"},{"issue":"4","key":"7_CR11","doi-asserted-by":"crossref","first-page":"2152","DOI":"10.1109\/TIP.2011.2172798","volume":"21","author":"HY Cheng","year":"2012","unstructured":"Cheng HY, Weng CC, Chen YY (2012) Vehicle detection in aerial surveillance using dynamic bayesian networks. IEEE Trans Image Process 21(4):2152\u20132159","journal-title":"IEEE Trans Image Process"},{"key":"7_CR12","doi-asserted-by":"crossref","unstructured":"Csurka G, Clinchant S. An empirical study of fusion operators for multimodal image retrieval. In: 10th international workshop on content-based multimedia indexing, IEEE, pp 1\u20136","DOI":"10.1109\/CBMI.2012.6269843"},{"key":"7_CR13","doi-asserted-by":"crossref","unstructured":"Dore A, Pinasco M, Regazzoni C (2009) Multi-modal data fusion techniques and applications. In: Multi-camera networks, pp 213\u2013237","DOI":"10.1016\/B978-0-12-374633-7.00011-2"},{"issue":"4","key":"7_CR14","doi-asserted-by":"publisher","first-page":"1456","DOI":"10.1109\/TCE.2007.4429237","volume":"53","author":"D Drajic","year":"2007","unstructured":"Drajic D, Cvejic N (2007) Adaptive fusion of multimodal surveillance image sequences in visual sensor networks. IEEE Trans Consum Electron 53(4):1456\u20131462","journal-title":"IEEE Trans Consum Electron"},{"issue":"12","key":"7_CR15","doi-asserted-by":"publisher","first-page":"952","DOI":"10.1109\/LSP.2007.908035","volume":"14","author":"Y Du","year":"2007","unstructured":"Du Y, Chen F, Xu W (2007) Human interaction representation and recognition through motion decomposition. IEEE Sig Process Lett 14(12):952\u2013955","journal-title":"IEEE Sig Process Lett"},{"key":"7_CR16","doi-asserted-by":"crossref","unstructured":"Fernandez Arguedas V, Izquierdo E (2011) Object classification based on behaviour patterns. In: International conference on imaging for crime detection and prevention","DOI":"10.1049\/ic.2011.0112"},{"key":"7_CR17","unstructured":"Fernandez Arguedas V, Zhang Q, Chandramouli K, Izquierdo E (2011) Multi-feature fusion for surveillance video indexing. In: International workshop on image analysis for multimedia interactive services, IEEE"},{"key":"7_CR18","doi-asserted-by":"crossref","unstructured":"Fernandez Arguedas V, Zhang Q, Chandramouli K, Izquierdo E (2012) Semantic hyper\/multi media adaptation, chapter Vision based semantic analysis of surveillance videos. Springer, Berlin, pp 83\u2013126","DOI":"10.1007\/978-3-642-28977-4_3"},{"key":"7_CR19","doi-asserted-by":"crossref","unstructured":"Fernandez Arguedas V, Zhang Q, Izquierdo E (2012) Bayesian multimodal fusion in forensic applications. In: Computer vision-ECCV 2012, workshops and demonstrations. Springer, pp 466\u2013475","DOI":"10.1007\/978-3-642-33885-4_47"},{"key":"7_CR20","doi-asserted-by":"crossref","unstructured":"Gupta H, Yu L, Hakeem A, Eun Choe T, Haering N, Locasto M (2011) Multimodal complex event detection framework for wide area surveillance. In: IEEE computer society conference on computer vision and pattern recognition workshops, pp 47\u201354","DOI":"10.1109\/CVPRW.2011.5981746"},{"key":"7_CR21","unstructured":"Huang T, Koller D, Malik J, Ogasawara G, Rao B, Russell S, Weber J (1995) Automatic symbolic traffic scene analysis using belief networks. In: Proceedings of the national conference on artificial intelligence. Wiley, pp 966\u2013966"},{"issue":"1","key":"7_CR22","doi-asserted-by":"publisher","first-page":"511","DOI":"10.1016\/j.eswa.2010.06.093","volume":"38","author":"SF Jiang","year":"2011","unstructured":"Jiang SF, Zhang CM, Zhang S (2011) Two-stage structural damage detection using fuzzy neural networks and data fusion techniques. Expert Syst Appl 38(1):511\u2013519","journal-title":"Expert Syst Appl"},{"issue":"2","key":"7_CR23","doi-asserted-by":"publisher","first-page":"201","DOI":"10.3758\/BF03212378","volume":"14","author":"G Johansson","year":"1973","unstructured":"Johansson G (1973) Visual perception of biological motion and a model for its analysis. Attention Percept Psychophys 14(2):201\u2013211","journal-title":"Attention Percept Psychophys"},{"issue":"1","key":"7_CR24","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11760-008-0099-7","volume":"4","author":"IN Junejo","year":"2010","unstructured":"Junejo IN (2010) Using dynamic bayesian network for scene modeling and anomaly detection. Sig Image Video Process 4(1):1\u201310","journal-title":"Sig Image Video Process"},{"key":"7_CR25","doi-asserted-by":"crossref","unstructured":"Klausner A, Tengg A, Rinner B (2007) Vehicle classification on multi-sensor smart cameras using feature-and decision-fusion. In: ACM\/IEEE international conference on distributed smart cameras, pp 67\u201374","DOI":"10.1109\/ICDSC.2007.4357507"},{"issue":"2","key":"7_CR26","doi-asserted-by":"publisher","first-page":"166","DOI":"10.1016\/j.imavis.2005.09.024","volume":"24","author":"X Liu","year":"2006","unstructured":"Liu X, Chua CS (2006) Multi-agent activity recognition using observation decomposedhidden markov models. Image Vis Comput 24(2):166\u2013175","journal-title":"Image Vis Comput"},{"issue":"2","key":"7_CR27","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1109\/JSEN.2002.1000251","volume":"2","author":"RC Luo","year":"2002","unstructured":"Luo RC, Yih CC, Su KL (2002) Multisensor fusion and integration: approaches, applications, and future research directions. IEEE Sens J 2(2):107\u2013119","journal-title":"IEEE Sens J"},{"key":"7_CR28","doi-asserted-by":"crossref","unstructured":"Ma J, Liu W, Miller P (2012) An evidential improvement for gender profiling. In: Denoeux\u00a0T, Masson M-H (eds) Belief functions: theory and applications, volume 164 of advances in intelligent and soft computing. Springer, Berlin\/Heidelberg, pp 29\u201336","DOI":"10.1007\/978-3-642-29461-7_3"},{"key":"7_CR29","doi-asserted-by":"crossref","unstructured":"Magalh\u00e3es J, R\u00fcger S (2007) Information-theoretic semantic multimedia indexing. In: ACM international conference on image and video retrieval, pp 619\u2013626","DOI":"10.1145\/1282280.1282368"},{"issue":"1","key":"7_CR30","doi-asserted-by":"publisher","first-page":"67","DOI":"10.1016\/j.conengprac.2004.02.005","volume":"13","author":"N Messai","year":"2005","unstructured":"Messai N, Thomas P, Lefebvre D, Moudni AE (2005) Neural networks for local monitoring of traffic magnetic sensors. Control Eng Pract 13(1):67\u201380","journal-title":"Control Eng Pract"},{"key":"7_CR31","first-page":"1","volume":"99","author":"M Meuter","year":"2011","unstructured":"Meuter M, Nunn C, G\u00f6rmer SM, M\u00fcller-Schneiders S, Kummert A (2011) A decision fusion and reasoning module for a traffic sign recognition system. IEEE Trans Intell Transp Sys 99:1\u20139","journal-title":"IEEE Trans Intell Transp Sys"},{"key":"7_CR32","doi-asserted-by":"crossref","unstructured":"Mironica I, Ionescu B, Knees P, Lambert P (2013) An in-depth evaluation of multimodal video genre categorization. In: 11th International workshop on content-based multimedia indexing, pp 11\u201316","DOI":"10.1109\/CBMI.2013.6576545"},{"key":"7_CR33","doi-asserted-by":"crossref","unstructured":"Moore DJ, Essa IA, Hayes MH III (1999) Exploiting human actions and object context for recognition tasks. In: IEEE international conference on computer vision, vol 1. pp 80\u201386","DOI":"10.1109\/ICCV.1999.791201"},{"key":"7_CR34","doi-asserted-by":"crossref","unstructured":"Nayak J, Gonzalez-Argueta L, Song B, Roy-Chowdhury A, Tuncel E (2008) Multi-target tracking through opportunistic camera control in a resource constrained multimodal sensor network. In: Second ACM\/IEEE international conference on distributed smart cameras, ICDSC 2008, pp 1\u201310","DOI":"10.1109\/ICDSC.2008.4635682"},{"key":"7_CR35","doi-asserted-by":"crossref","unstructured":"Nirmala DE, Paul BS, Vaidehi V (2011) A novel multimodal image fusion method using shift invariant discrete wavelet transform and support vector machines. In: International conference on recent trends in information technology, pp 932\u2013937","DOI":"10.1109\/ICRTIT.2011.5972405"},{"issue":"8","key":"7_CR36","doi-asserted-by":"publisher","first-page":"831","DOI":"10.1109\/34.868684","volume":"22","author":"NM Oliver","year":"2000","unstructured":"Oliver NM, Rosario B, Pentland AP (2000) A bayesian computer vision system for modeling human interactions. IEEE Trans Pattern Anal Mach Intell 22(8):831\u2013843","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"issue":"3","key":"7_CR37","first-page":"187","volume":"14","author":"C Ozkurt","year":"2010","unstructured":"Ozkurt C, Camci F (2010) Automatic traffic density estimation and vehicle classification for traffic surveillance systems using neural networks. Math Comput Appl 14(3):187","journal-title":"Math Comput Appl"},{"key":"7_CR38","doi-asserted-by":"crossref","unstructured":"Prati A, Vezzani R, Benini L, Farella E, Zappi P (2005) An integrated multi-modal sensor network for video surveillance. In: ACM international workshop on video surveillance and sensor networks, pp 95\u2013102","DOI":"10.1145\/1099396.1099415"},{"key":"7_CR39","unstructured":"Rashidi A, Ghassemian H (2003) Extended dempster-shafer theory for multi-system\/sensor decision fusion. In: Joint workshop on challenges in geospatial analysis, integration and visualization II, pp 31\u201337"},{"key":"7_CR40","doi-asserted-by":"crossref","unstructured":"Remagnino P, Tan T, Baker K (1998) Agent orientated annotation in model based visual surveillance. In: International conference on computer vision, pp 857\u2013862","DOI":"10.1109\/ICCV.1998.710817"},{"key":"7_CR41","doi-asserted-by":"crossref","unstructured":"Snidaro L, Visentini I, Foresti G (2011) Data fusion in modern surveillance. In: Innovations in defence support systems-3, pp 1\u201321","DOI":"10.1007\/978-3-642-18278-5_1"},{"key":"7_CR42","doi-asserted-by":"crossref","unstructured":"Snoek CGM, Worring M, Smeulders AWM (2005) Early versus late fusion in semantic video analysis. In: ACM international conference on multimedia","DOI":"10.1145\/1101149.1101236"},{"issue":"7","key":"7_CR43","doi-asserted-by":"crossref","first-page":"932","DOI":"10.1109\/TCSVT.2011.2133570","volume":"21","author":"HI Suk","year":"2011","unstructured":"Suk HI, Jain AK, Lee SW (2011) A network of dynamic probabilistic models for human interaction analysis. IEEE Trans Circ Syst Video Technol 21(7):932\u2013945","journal-title":"IEEE Trans Circ Syst Video Technol"},{"issue":"11","key":"7_CR44","doi-asserted-by":"crossref","first-page":"1473","DOI":"10.1109\/TCSVT.2008.2005594","volume":"18","author":"P Turaga","year":"2008","unstructured":"Turaga P, Chellappa R, Subrahmanian VS, Udrea O (2008) Machine recognition of human activities: a survey. IEEE Trans Circ Sys Video Technol 18(11):1473\u20131488","journal-title":"IEEE Trans Circ Sys Video Technol"},{"key":"7_CR45","doi-asserted-by":"crossref","unstructured":"Vanajakshi L, Rilett LR (2004) A comparison of the performance of artificial neural networks and support vector machines for the prediction of traffic speed. In: IEEE intelligent vehicles symposium, pp 194\u2013199","DOI":"10.1109\/IVS.2004.1336380"},{"issue":"3","key":"7_CR46","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1016\/j.trc.2005.04.007","volume":"13","author":"EI Vlahogianni","year":"2005","unstructured":"Vlahogianni EI, Karlaftis MG, Golias JC (2005) Optimized and meta-optimized neural networks for short-term traffic flow prediction: a genetic approach. Transp Res Part C Emerg Technol 13(3):211\u2013234","journal-title":"Transp Res Part C Emerg Technol"},{"key":"7_CR47","doi-asserted-by":"crossref","unstructured":"Wu Z, Cai L, Meng H (2006) Multi-level fusion of audio and visual features for speaker identification. In: International conference on advances in biometrics, pp 493\u2013499","DOI":"10.1007\/11608288_66"},{"key":"7_CR48","unstructured":"Xiao JM, Wang XH (2004) Study on traffic flow prediction using rbf neural network. In: International conference on machine learning and cybernetics, vol 5. pp 2672\u20132675"},{"key":"7_CR49","doi-asserted-by":"crossref","unstructured":"Zhang Q, Izquierdo E (2007) Combining low-level features for semantic inference in image retrieval. In: EURASIP journal on advances in signal processing, p 12","DOI":"10.1155\/2007\/61423"},{"key":"7_CR50","unstructured":"Zou X, Bhanu B (2005) Tracking humans using multi-modal fusion. In: IEEE computer society conference on computer vision and pattern recognition, pp 4\u20134"}],"container-title":["Advances in Computer Vision and Pattern Recognition","Fusion in Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-05696-8_7","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,2]],"date-time":"2025-05-02T21:28:33Z","timestamp":1746221313000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-05696-8_7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014]]},"ISBN":["9783319056951","9783319056968"],"references-count":50,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-05696-8_7","relation":{},"ISSN":["2191-6586","2191-6594"],"issn-type":[{"type":"print","value":"2191-6586"},{"type":"electronic","value":"2191-6594"}],"subject":[],"published":{"date-parts":[[2014]]},"assertion":[{"value":"26 March 2014","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}}]}}