{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T16:58:31Z","timestamp":1777654711280,"version":"3.51.4"},"reference-count":42,"publisher":"American Association for the Advancement of Science (AAAS)","issue":"46","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Sci. Adv."],"published-print":{"date-parts":[[2021,11,12]]},"abstract":"<jats:p>Deep learning using audiovisual data from chimpanzee percussive behaviors enables action recognition in the wild.<\/jats:p>","DOI":"10.1126\/sciadv.abi4883","type":"journal-article","created":{"date-parts":[[2021,11,12]],"date-time":"2021-11-12T18:56:46Z","timestamp":1636743406000},"source":"Crossref","is-referenced-by-count":82,"title":["Automated audiovisual behavior recognition in wild primates"],"prefix":"10.1126","volume":"7","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2345-5441","authenticated-orcid":true,"given":"Max","family":"Bain","sequence":"first","affiliation":[{"name":"Visual Geometry Group, Department of Engineering Science, University of Oxford, Oxford, UK."}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2190-9013","authenticated-orcid":true,"given":"Arsha","family":"Nagrani","sequence":"additional","affiliation":[{"name":"Visual Geometry Group, Department of Engineering Science, University of Oxford, Oxford, UK."}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3308-0209","authenticated-orcid":true,"given":"Daniel","family":"Schofield","sequence":"additional","affiliation":[{"name":"Primate Models for Behavioural Evolution Lab, Institute of Human Sciences, School of Anthropology and Museum Ethnography, University of Oxford, Oxford, UK."}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2162-1087","authenticated-orcid":true,"given":"Sophie","family":"Berdugo","sequence":"additional","affiliation":[{"name":"Primate Models for Behavioural Evolution Lab, Institute of Human Sciences, School of Anthropology and Museum Ethnography, University of Oxford, Oxford, UK."},{"name":"Social Body Lab, Institute of Human Sciences, School of Anthropology and Museum Ethnography, University of Oxford, Oxford, UK."}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7196-5369","authenticated-orcid":true,"given":"Joana","family":"Bessa","sequence":"additional","affiliation":[{"name":"Department of Zoology, University of Oxford, Oxford, UK."}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8490-3949","authenticated-orcid":true,"given":"Jake","family":"Owen","sequence":"additional","affiliation":[{"name":"Department of Zoology, University of Oxford, Oxford, UK."}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6187-644X","authenticated-orcid":true,"given":"Kimberley J.","family":"Hockings","sequence":"additional","affiliation":[{"name":"Centre for Ecology and Conservation, College of Life and Environmental Sciences, University of Exeter, Exeter, UK."}]},{"given":"Tetsuro","family":"Matsuzawa","sequence":"additional","affiliation":[{"name":"Division of the Humanities and Social Sciences, California Institute of Technology, 1200 E. California Blvd., MC 228-77, Pasadena, CA 91125, USA."}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7289-6414","authenticated-orcid":true,"given":"Misato","family":"Hayashi","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3408-6274","authenticated-orcid":true,"given":"Dora","family":"Biro","sequence":"additional","affiliation":[{"name":"Department of Zoology, University of Oxford, Oxford, UK."},{"name":"Department of Brain and Cognitive Sciences, University of Rochester, Rochester, NY, USA."}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4542-3720","authenticated-orcid":true,"given":"Susana","family":"Carvalho","sequence":"additional","affiliation":[{"name":"Primate Models for Behavioural Evolution Lab, Institute of Human Sciences, School of Anthropology and Museum Ethnography, University of Oxford, Oxford, UK."},{"name":"Gorongosa National Park, Sofala, Mozambique."},{"name":"Centre for Functional Ecology, Department of Life Sciences, Coimbra University, Coimbra, Portugal."},{"name":"Interdisciplinary Centre for Archaeology and Evolution of Human Behaviour, Algarve University, Faro, Portugal."}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8945-8573","authenticated-orcid":true,"given":"Andrew","family":"Zisserman","sequence":"additional","affiliation":[{"name":"Visual Geometry Group, Department of Engineering Science, University of Oxford, Oxford, UK."}]}],"member":"221","reference":[{"key":"e_1_3_3_2_2","doi-asserted-by":"publisher","DOI":"10.1111\/j.1439-0310.1963.tb01161.x"},{"key":"e_1_3_3_3_2","doi-asserted-by":"publisher","DOI":"10.1016\/j.tree.2013.06.002"},{"key":"e_1_3_3_4_2","doi-asserted-by":"publisher","DOI":"10.1016\/j.neuron.2014.09.005"},{"key":"e_1_3_3_5_2","doi-asserted-by":"publisher","DOI":"10.1038\/s41386-020-0776-y"},{"key":"e_1_3_3_6_2","doi-asserted-by":"publisher","DOI":"10.1016\/j.jneumeth.2019.108536"},{"key":"e_1_3_3_7_2","first-page":"e01510","article-title":"Giant panda behaviour recognition using images","volume":"26","author":"Swarup P.","year":"2021","unstructured":"P. Swarup, P. Chen, R. Hou, P. Que, P. Liu, A. W. K. Kong, Giant panda behaviour recognition using images. Glob. Ecol. Conserv. 26, e01510 (2021).","journal-title":"Glob. Ecol. Conserv."},{"key":"e_1_3_3_8_2","doi-asserted-by":"publisher","DOI":"10.1098\/rsbl.2019.0695"},{"key":"e_1_3_3_9_2","doi-asserted-by":"publisher","DOI":"10.1111\/1365-2656.13336"},{"key":"e_1_3_3_10_2","doi-asserted-by":"publisher","DOI":"10.1038\/s41559-020-1135-4"},{"key":"e_1_3_3_11_2","doi-asserted-by":"publisher","DOI":"10.1093\/beheco\/art086"},{"key":"e_1_3_3_12_2","doi-asserted-by":"publisher","DOI":"10.1002\/rse2.48"},{"key":"e_1_3_3_13_2","doi-asserted-by":"publisher","DOI":"10.1163\/156853901317367717"},{"key":"e_1_3_3_14_2","unstructured":"M. Bain A. Nagrani D. Schofield A. Zisserman in Workshop on Computer Vision for Wildlife Conservation ICCV (IEEE 2019)."},{"key":"e_1_3_3_15_2","doi-asserted-by":"publisher","DOI":"10.1126\/sciadv.aaw0736"},{"key":"e_1_3_3_16_2","doi-asserted-by":"publisher","DOI":"10.1038\/s41593-018-0209-y"},{"key":"e_1_3_3_17_2","doi-asserted-by":"crossref","unstructured":"D. Shao Y. Zhao B. Dai D. Lin FineGym: A hierarchical video dataset for fine-grained action understanding in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (IEEE 2020) pp. 2616\u20132625.","DOI":"10.1109\/CVPR42600.2020.00269"},{"key":"e_1_3_3_18_2","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1719367115"},{"key":"e_1_3_3_19_2","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2012.59"},{"key":"e_1_3_3_20_2","doi-asserted-by":"crossref","unstructured":"J. Carreira A. Zisserman Quo Vadis action recognition? A new model and the kinetics dataset in Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (IEEE 2017) pp. 6299\u20136308.","DOI":"10.1109\/CVPR.2017.502"},{"key":"e_1_3_3_21_2","unstructured":"F. Sakib T. Burghardt Visual recognition of great ape behaviours in the wild. arXiv:2011.10759 [cs.CV] (21 November 2020); http:\/\/arxiv.org\/abs\/2011.10759."},{"key":"e_1_3_3_22_2","doi-asserted-by":"crossref","unstructured":"R. Gao T.-H. Oh K. Grauman L. Torresani Listen to Look: Action recognition by previewing audio in Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (IEEE 2020) pp. 10457\u201310467.","DOI":"10.1109\/CVPR42600.2020.01047"},{"key":"e_1_3_3_23_2","unstructured":"T. Matsuzawa Field experiments on use of stone tools by chimpanzees in the wild in Chimpanzee Cultures R. W. Wrangham W. C. McGrew F. B. M. de Wall P. G. Heltne Eds. (Harvard Univ. Press 1994) pp. 351\u2013370."},{"key":"e_1_3_3_24_2","doi-asserted-by":"publisher","DOI":"10.3389\/fevo.2021.625303"},{"key":"e_1_3_3_25_2","doi-asserted-by":"publisher","DOI":"10.1007\/s10071-003-0183-x"},{"key":"e_1_3_3_26_2","doi-asserted-by":"publisher","DOI":"10.1007\/BF02557572"},{"key":"e_1_3_3_27_2","doi-asserted-by":"crossref","unstructured":"D. Deb S. Wiper A. Russo S. Gong Y. Shi C. Tymoszek A. Jain Face recognition: Primates in the wild arXiv:1804.08790 [cs.CV] (24 April 2018); http:\/\/arxiv.org\/abs\/1804.08790.","DOI":"10.1109\/BTAS.2018.8698538"},{"key":"e_1_3_3_28_2","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-021-22970-y"},{"key":"e_1_3_3_29_2","doi-asserted-by":"publisher","DOI":"10.1126\/science.aau4532"},{"key":"e_1_3_3_30_2","doi-asserted-by":"publisher","DOI":"10.1111\/2041-210X.13504"},{"key":"e_1_3_3_31_2","doi-asserted-by":"crossref","unstructured":"T. Han W. Xie A. Zisserman Video representation learning by dese predictive coding in Proceedings of the IEEE International Conference on Computer Vision Workshops (IEEE 2019) pp. 1483\u20131492.","DOI":"10.1109\/ICCVW.2019.00186"},{"key":"e_1_3_3_32_2","doi-asserted-by":"crossref","unstructured":"T. Matsuzawa T. Humle Y. Sugiyama The Chimpanzees of Bossou and Nimba (Springer Science & Business Media 2011).","DOI":"10.1007\/978-4-431-53921-6"},{"key":"e_1_3_3_33_2","doi-asserted-by":"publisher","DOI":"10.1016\/j.jhevol.2008.02.005"},{"key":"e_1_3_3_34_2","doi-asserted-by":"publisher","DOI":"10.1007\/BF02435610"},{"key":"e_1_3_3_35_2","doi-asserted-by":"crossref","unstructured":"T. Nishida Chimpanzees of the Lakeshore: Natural History and Culture at Mahale (Cambridge Univ. Press 2011).","DOI":"10.1017\/CBO9781139059497"},{"key":"e_1_3_3_36_2","doi-asserted-by":"publisher","DOI":"10.1002\/ajpa.22634"},{"key":"e_1_3_3_37_2","doi-asserted-by":"crossref","unstructured":"V. Reynolds The Chimpanzees of the Budongo Forest: Ecology Behaviour and Conservation (OUP Oxford 2005).","DOI":"10.1093\/acprof:oso\/9780198515463.001.0001"},{"key":"e_1_3_3_38_2","doi-asserted-by":"crossref","unstructured":"W. Liu D. Anguelov D. Erhan C. Szegedy S. Reed C.-Y. Fu A. C. Berg European Conference on Computer Vision (Springer 2016) pp. 21\u201337.","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"e_1_3_3_39_2","unstructured":"A. Dutta A. Zisserman in Proceedings of the 27th ACM International Conference on Multimedia (MM \u201819) (Association for Computing Machinery 2019) pp. 2276\u20132279."},{"key":"e_1_3_3_40_2","doi-asserted-by":"crossref","unstructured":"H. Chen W. Xie A. Vedaldi A. Zisserman Vggsound: A large-scale audio-visual dataset in Proceedings of ICASSP 2020\u20132020 IEEE International Conference on Acoustics Speech and Signal Processing (ICASSP) (IEEE 2020) pp. 721\u2013725.","DOI":"10.1109\/ICASSP40776.2020.9053174"},{"key":"e_1_3_3_41_2","doi-asserted-by":"crossref","unstructured":"J. Yu H. Su J. Liu Z. Yang Z. Zhang Y. Zhu L. Yang B. Jiao A Strong Baseline for Tiger Re-ID and its Bag of Tricks in Proceedings of the IEEE International Conference on Computer Vision Workshops (IEEE 2019) pp. 302\u2013309.","DOI":"10.1109\/ICCVW.2019.00040"},{"key":"e_1_3_3_42_2","doi-asserted-by":"publisher","DOI":"10.1002\/ece3.6152"},{"key":"e_1_3_3_43_2","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-009-0275-4"}],"container-title":["Science Advances"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.science.org\/doi\/pdf\/10.1126\/sciadv.abi4883","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,9]],"date-time":"2024-01-09T18:27:42Z","timestamp":1704824862000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.science.org\/doi\/10.1126\/sciadv.abi4883"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,11,12]]},"references-count":42,"journal-issue":{"issue":"46","published-print":{"date-parts":[[2021,11,12]]}},"alternative-id":["10.1126\/sciadv.abi4883"],"URL":"https:\/\/doi.org\/10.1126\/sciadv.abi4883","relation":{},"ISSN":["2375-2548"],"issn-type":[{"value":"2375-2548","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,11,12]]},"article-number":"eabi4883"}}