{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,29]],"date-time":"2026-03-29T10:00:50Z","timestamp":1774778450778,"version":"3.50.1"},"reference-count":81,"publisher":"Elsevier","isbn-type":[{"value":"9780128092767","type":"print"}],"license":[{"start":{"date-parts":[[2017,1,1]],"date-time":"2017-01-01T00:00:00Z","timestamp":1483228800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017]]},"DOI":"10.1016\/b978-0-12-809276-7.00011-4","type":"book-chapter","created":{"date-parts":[[2017,4,21]],"date-time":"2017-04-21T16:30:32Z","timestamp":1492792232000},"page":"183-207","source":"Crossref","is-referenced-by-count":37,"title":["Learning to Predict Human Behavior in Crowded Scenes"],"prefix":"10.1016","author":[{"given":"Alexandre","family":"Alahi","sequence":"first","affiliation":[]},{"given":"Vignesh","family":"Ramanathan","sequence":"additional","affiliation":[]},{"given":"Kratarth","family":"Goel","sequence":"additional","affiliation":[]},{"given":"Alexandre","family":"Robicquet","sequence":"additional","affiliation":[]},{"given":"Amir A.","family":"Sadeghian","sequence":"additional","affiliation":[]},{"given":"Li","family":"Fei-Fei","sequence":"additional","affiliation":[]},{"given":"Silvio","family":"Savarese","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0005","doi-asserted-by":"publisher","first-page":"1018","DOI":"10.1126\/science.1177170","article-title":"Limits of predictability in human mobility","author":"Song","year":"2010","journal-title":"Science"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0010","series-title":"ECCV","article-title":"Activity forecasting","author":"Kitani","year":"2012"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0015","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevE.51.4282","article-title":"Social force model for pedestrian dynamics","author":"Helbing","year":"1995","journal-title":"Phys Rev E"},{"issue":"4","key":"10.1016\/B978-0-12-809276-7.00011-4_br0020","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0010047","article-title":"The walking behaviour of pedestrian social groups and its impact on crowd dynamics","volume":"5","author":"Moussa\u00efd","year":"2010","journal-title":"PLoS ONE"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0025","series-title":"ICRA","first-page":"464","article-title":"People tracking with human motion predictions from social forces","author":"Luber","year":"2010"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0030","series-title":"IEEE conference on computer vision and pattern recognition","first-page":"935","article-title":"Abnormal crowd behavior detection using social force model","author":"Mehran","year":"2009"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0035","author":"Graves"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0040","series-title":"Social intelligence: the new science of success","author":"Albrecht","year":"2006"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0045","series-title":"Proceedings of the 31st international conference on machine learning (ICML-14)","first-page":"1764","article-title":"Towards end-to-end speech recognition with recurrent neural networks","author":"Graves","year":"2014"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0050","series-title":"ICCV","article-title":"You'll never walk alone: modeling social behavior for multi-target tracking","author":"Pellegrini","year":"2009"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0055","doi-asserted-by":"publisher","first-page":"655","DOI":"10.1111\/j.1467-8659.2007.01089.x","article-title":"Crowds by example","volume":"26","author":"Lerner","year":"2007","journal-title":"Comput Graph Forum"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0060","series-title":"CVPR","article-title":"Who are you with and where are you going?","author":"Yamaguchi","year":"2011"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0065","series-title":"ECCV","article-title":"Improving data association by joint modeling of pedestrian trajectories and groupings","author":"Pellegrini","year":"2010"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0070","series-title":"ICCV workshops","article-title":"Everybody needs somebody: modeling social and grouping behavior on a linear programming multiple people tracker","author":"Leal-Taixe","year":"2011"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0075","series-title":"CVPR","first-page":"3542","article-title":"Learning an image-based motion context for multiple people tracking","author":"Leal-Taix\u00e9","year":"2014"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0080","series-title":"Computer vision \u2013 ECCV 2012","first-page":"215","article-title":"A unified framework for multi-target tracking and collective activity recognition","author":"Choi","year":"2012"},{"issue":"6","key":"10.1016\/B978-0-12-809276-7.00011-4_br0085","doi-asserted-by":"publisher","first-page":"1242","DOI":"10.1109\/TPAMI.2013.220","article-title":"Understanding collective activities of people from videos","volume":"36","author":"Choi","year":"2014","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0090","doi-asserted-by":"publisher","first-page":"1160","DOI":"10.1145\/1141911.1142008","article-title":"Continuum crowds","volume":"25","author":"Treuille","year":"2006","journal-title":"ACM Trans Graph"},{"issue":"8","key":"10.1016\/B978-0-12-809276-7.00011-4_br0095","doi-asserted-by":"publisher","first-page":"667","DOI":"10.1016\/j.trb.2005.09.006","article-title":"Discrete choice models of pedestrian walking behavior","volume":"40","author":"Antonini","year":"2006","journal-title":"Transp Res, Part B, Methodol"},{"issue":"2","key":"10.1016\/B978-0-12-809276-7.00011-4_br0100","doi-asserted-by":"publisher","first-page":"283","DOI":"10.1109\/TPAMI.2007.1167","article-title":"Gaussian process dynamical models for human motion","volume":"30","author":"Wang","year":"2008","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0105","series-title":"Field and service robotics","first-page":"381","article-title":"Modelling smooth paths using Gaussian processes","author":"Tay","year":"2008"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0110","series-title":"Proceedings of the IEEE conference on computer vision and pattern recognition","first-page":"3488","article-title":"Understanding pedestrian behaviors from stationary crowd groups","author":"Yi","year":"2015"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0115","series-title":"ICCV","article-title":"Social saliency prediction","author":"Park","year":"2015"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0120","series-title":"CVPR","article-title":"Socially-aware large-scale crowd forecasting","author":"Alahi","year":"2014"},{"issue":"Suppl. 3","key":"10.1016\/B978-0-12-809276-7.00011-4_br0125","doi-asserted-by":"publisher","first-page":"7280","DOI":"10.1073\/pnas.082080899","article-title":"Agent-based modeling: methods and techniques for simulating human systems","volume":"99","author":"Bonabeau","year":"2002","journal-title":"Proc Natl Acad Sci USA"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0130","series-title":"2011 IEEE international conference on computer vision (ICCV)","first-page":"1235","article-title":"Data-driven crowd analysis in videos","author":"Rodriguez","year":"2011"},{"issue":"4","key":"10.1016\/B978-0-12-809276-7.00011-4_br0135","doi-asserted-by":"publisher","first-page":"1168","DOI":"10.1109\/TIP.2006.891352","article-title":"Semantic-based surveillance video retrieval","volume":"16","author":"Hu","year":"2007","journal-title":"IEEE Trans Image Process"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0140","series-title":"2011 IEEE international conference on computer vision (ICCV)","first-page":"1164","article-title":"Gaussian process regression flow for analysis of motion trajectories","author":"Kim","year":"2011"},{"issue":"11","key":"10.1016\/B978-0-12-809276-7.00011-4_br0145","doi-asserted-by":"publisher","first-page":"2287","DOI":"10.1109\/TPAMI.2011.64","article-title":"Trajectory learning for activity understanding: unsupervised, multilevel, and long-term adaptive approach","volume":"33","author":"Morris","year":"2011","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0150","series-title":"2011 IEEE conference on computer vision and pattern recognition (CVPR)","first-page":"3441","article-title":"Random field topic model for semantic region analysis in crowded scenes from tracklets","author":"Zhou","year":"2011"},{"issue":"8","key":"10.1016\/B978-0-12-809276-7.00011-4_br0155","doi-asserted-by":"publisher","first-page":"1114","DOI":"10.1109\/TCSVT.2008.927109","article-title":"A survey of vision-based trajectory learning and analysis for surveillance","volume":"18","author":"Morris","year":"2008","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0160","author":"Pirsiavash"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0165","series-title":"Computer vision \u2013 ECCV 2014","first-page":"618","article-title":"Context-based pedestrian path prediction","author":"Kooij","year":"2014"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0170","series-title":"2014 international joint conference on neural networks (IJCNN)","first-page":"1494","article-title":"A predictive model for recognizing human behaviour based on trajectory representation","author":"Azorin-Lopez","year":"2014"},{"issue":"4","key":"10.1016\/B978-0-12-809276-7.00011-4_br0175","doi-asserted-by":"publisher","first-page":"591","DOI":"10.1016\/j.robot.2014.01.003","article-title":"Learning intentions for improved human motion prediction","volume":"62","author":"Elfring","year":"2014","journal-title":"Robot Auton Syst"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0180","series-title":"Computer vision \u2013 ECCV 2014","first-page":"596","article-title":"A discriminative model with multiple temporal scales for action prediction","author":"Kong","year":"2014"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0185","series-title":"Computer vision \u2013 ECCV 2012","first-page":"201","article-title":"Activity forecasting","author":"Kitani","year":"2012"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0190","series-title":"CVPR","article-title":"Patch to the future: unsupervised visual prediction","author":"Walker","year":"2014"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0195","series-title":"IEEE\/RSJ international conference on intelligent robots and systems","first-page":"3931","article-title":"Planning-based prediction for pedestrians","author":"Ziebart","year":"2009"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0200","series-title":"2013 13th IEEE\u2013RAS international conference on humanoid robots (Humanoids)","first-page":"499","article-title":"Probabilistic human action prediction and wait-sensitive planning for responsive human\u2013robot collaboration","author":"Hawkins","year":"2013"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0205","series-title":"ECCV","article-title":"Unsupervised learning of functional categories in video scenes","author":"Turek","year":"2010"},{"issue":"8","key":"10.1016\/B978-0-12-809276-7.00011-4_br0210","doi-asserted-by":"publisher","first-page":"1644","DOI":"10.1109\/TPAMI.2013.2297321","article-title":"Prediction of human activity by discovering temporal sequence patterns","volume":"36","author":"Li","year":"2014","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0215","series-title":"ECCV","article-title":"Robust object tracking by hierarchical association of detection responses","author":"Huang","year":"2008"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0220","series-title":"Proceedings of the 2011 international conference on computer vision","first-page":"619","article-title":"Multi-hypothesis motion planning for visual object tracking","author":"Gong","year":"2011"},{"issue":"3","key":"10.1016\/B978-0-12-809276-7.00011-4_br0225","doi-asserted-by":"publisher","first-page":"397","DOI":"10.1109\/TSMCB.2005.846652","article-title":"Learning semantic scene models from observing activity in visual surveillance","volume":"35","author":"Makris","year":"2005","journal-title":"IEEE Trans Syst Man Cybern, Part B, Cybern"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0230","series-title":"2014 IEEE international conference on robotics and automation (ICRA)","first-page":"4015","article-title":"Learning to predict trajectories of cooperatively navigating agents","author":"Kretzschmar","year":"2014"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0235","series-title":"2014 IEEE conference on computer vision and pattern recognition (CVPR)","first-page":"2027","article-title":"Predicting object dynamics in scenes","author":"Fouhey","year":"2014"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0240","series-title":"Computer vision \u2013 ECCV 2014","first-page":"489","article-title":"Action-reaction: forecasting the dynamics of human interaction","author":"Huang","year":"2014"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0245","series-title":"2011 IEEE international conference on computer vision (ICCV)","first-page":"1036","article-title":"Human activity prediction: early recognition of ongoing activities from streaming videos","author":"Ryoo","year":"2011"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0250","series-title":"2013 IEEE conference on computer vision and pattern recognition (CVPR)","first-page":"2658","article-title":"Recognize human activities from partially observed videos","author":"Cao","year":"2013"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0255","series-title":"2013 IEEE international conference on computer vision (ICCV)","first-page":"2224","article-title":"Inferring \u201cdark matter\u201d and \u201cdark energy\u201d from videos","author":"Xie","year":"2013"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0260","series-title":"Computer vision \u2013 ECCV 2014","first-page":"421","article-title":"Predicting actions from static scenes","author":"Vu","year":"2014"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0265","series-title":"Proceedings of the 21st ACM SIGKDD international conference on knowledge discovery and data mining","first-page":"805","article-title":"Data-driven activity prediction: algorithms, evaluation methodology, and applications","author":"Minor","year":"2015"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0270","series-title":"13th international conference on machine learning and applications (ICMLA)","first-page":"47","article-title":"Bayesian nonparametric inverse reinforcement learning for switched Markov decision processes","author":"Surana","year":"2014"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0275","author":"Ranzato"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0280","author":"Srivastava"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0285","author":"Vondrick"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0290","author":"Ryoo"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0295","series-title":"2011 IEEE conference on computer vision and pattern recognition (CVPR)","first-page":"3241","article-title":"Fast unsupervised ego-action learning for first-person sports videos","author":"Kitani","year":"2011"},{"issue":"8","key":"10.1016\/B978-0-12-809276-7.00011-4_br0300","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","article-title":"Long short-term memory","volume":"9","author":"Hochreiter","year":"1997","journal-title":"Neural Comput"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0305","author":"Chung"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0310","author":"Chorowski"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0315","author":"Chung"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0320","author":"Vinyals"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0325","series-title":"NIPS","article-title":"Deep fragment embeddings for bidirectional image sentence mapping","author":"Karpathy","year":"2014"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0330","author":"Yoo"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0335","author":"Donahue"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0340","author":"Xu"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0345","author":"Bahdanau"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0350","series-title":"ICCV","article-title":"Look and think twice: capturing top-down visual attention with feedback convolutional neural networks","author":"Cao","year":"2015"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0355","author":"Gregor"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0360","author":"Xiao"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0365","author":"Ng"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0370","series-title":"ICCV","article-title":"Recurrent network models for human dynamics","author":"Fragkiadaki","year":"2015"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0375","author":"Zheng"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0380","author":"Pinheiro"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0385","author":"Visin"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0390","author":"Dauphin"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0395","unstructured":"Bergstra J, Breuleux O, Bastien F, Lamblin P, Pascanu R, Desjardins G, Turian J, Warde-Farley D, Bengio Y. Theano: a CPU and GPU math compiler in Python."},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0400","series-title":"2013 IEEE international conference on robotics and automation (ICRA)","first-page":"2153","article-title":"Robot navigation in dense human crowds: the case for cooperation","author":"Trautman","year":"2013"},{"key":"10.1016\/B978-0-12-809276-7.00011-4_br0405","series-title":"2010 IEEE\/RSJ international conference on intelligent robots and systems (IROS)","first-page":"797","article-title":"Unfreezing the robot: navigation in dense, interacting crowds","author":"Trautman","year":"2010"}],"container-title":["Group and Crowd Behavior for Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:B9780128092767000114?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:B9780128092767000114?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2018,9,2]],"date-time":"2018-09-02T14:22:14Z","timestamp":1535898134000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/B9780128092767000114"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017]]},"ISBN":["9780128092767"],"references-count":81,"URL":"https:\/\/doi.org\/10.1016\/b978-0-12-809276-7.00011-4","relation":{},"subject":[],"published":{"date-parts":[[2017]]}}}