{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T01:40:48Z","timestamp":1755826848147,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":34,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,3,11]],"date-time":"2024-03-11T00:00:00Z","timestamp":1710115200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,3,11]]},"DOI":"10.1145\/3610978.3640648","type":"proceedings-article","created":{"date-parts":[[2024,3,10]],"date-time":"2024-03-10T22:55:43Z","timestamp":1710111343000},"page":"1199-1203","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Improving Visual Perception of a Social Robot for Controlled and In-the-wild Human-robot Interaction"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-6428-916X","authenticated-orcid":false,"given":"Wangjie","family":"Zhong","sequence":"first","affiliation":[{"name":"Faculty of IT, Monash University, Melbourne, Australia"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8559-5610","authenticated-orcid":false,"given":"Leimin","family":"Tian","sequence":"additional","affiliation":[{"name":"Faculty of Engineering, Monash University, Melbourne, Australia"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2356-4530","authenticated-orcid":false,"given":"Duy Tho","family":"Le","sequence":"additional","affiliation":[{"name":"Faculty of IT, Monash University, Melbourne, Australia"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8659-8773","authenticated-orcid":false,"given":"Hamid","family":"Rezatofighi","sequence":"additional","affiliation":[{"name":"Faculty of IT, Monash University, Melbourne, Australia"}]}],"member":"320","published-online":{"date-parts":[[2024,3,11]]},"reference":[{"key":"e_1_3_2_2_1_1","volume-title":"BoT-SORT: Robust associations multi-pedestrian tracking. arXiv preprint arXiv:2206.14651","author":"Aharon Nir","year":"2022","unstructured":"Nir Aharon, Roy Orfaig, and Ben-Zion Bobrovsky. 2022. BoT-SORT: Robust associations multi-pedestrian tracking. arXiv preprint arXiv:2206.14651 (2022)."},{"key":"e_1_3_2_2_2_1","doi-asserted-by":"publisher","DOI":"10.1007\/s12369-015-0298-7"},{"key":"e_1_3_2_2_3_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58799-4_69"},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"publisher","DOI":"10.1007\/s12369-008-0001-3"},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2960798"},{"key":"e_1_3_2_2_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/3406499.3415073"},{"key":"e_1_3_2_2_7_1","volume-title":"Adapted pepper. arXiv preprint arXiv:2009.03648","author":"Caniot Maxime","year":"2020","unstructured":"Maxime Caniot, Vincent Bonnet, Maxime Busy, Thierry Labaye, Michel Besombes, Sebastien Courtois, and Edouard Lagrue. 2020. Adapted pepper. arXiv preprint arXiv:2009.03648 (2020)."},{"key":"e_1_3_2_2_8_1","volume-title":"Observation-centric sort: Rethinking sort for robust multi-object tracking. arXiv preprint arXiv:2203.14360","author":"Cao Jinkun","year":"2022","unstructured":"Jinkun Cao, Xinshuo Weng, Rawal Khirodkar, Jiangmiao Pang, and Kris Kitani. 2022. Observation-centric sort: Rethinking sort for robust multi-object tracking. arXiv preprint arXiv:2203.14360 (2022)."},{"key":"e_1_3_2_2_9_1","volume-title":"2D Human pose estimation: a survey. Multimedia Systems","author":"Chen Haoming","year":"2022","unstructured":"Haoming Chen, Runyang Feng, Sifan Wu, Hao Xu, Fengcheng Zhou, and Zhenguang Liu. 2022. 2D Human pose estimation: a survey. Multimedia Systems (2022), 1--24."},{"key":"e_1_3_2_2_10_1","doi-asserted-by":"publisher","DOI":"10.26599\/TST.2018.9010100"},{"key":"e_1_3_2_2_11_1","doi-asserted-by":"publisher","DOI":"10.1007\/s13369-021-05401-4"},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6724"},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"publisher","DOI":"10.11591\/ijai.v12.i2.pp585-592"},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1007\/s12369-020-00679-0"},{"key":"e_1_3_2_2_15_1","doi-asserted-by":"publisher","DOI":"10.1007\/s42979-022-01567-2"},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3126387"},{"key":"e_1_3_2_2_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2018.8546194"},{"key":"e_1_3_2_2_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2903455"},{"key":"e_1_3_2_2_19_1","doi-asserted-by":"publisher","DOI":"10.1061\/(ASCE)CO.1943-7862.0002154"},{"key":"e_1_3_2_2_20_1","volume-title":"Multiple object tracking: A literature review. Artificial intelligence 293","author":"Luo Wenhan","year":"2021","unstructured":"Wenhan Luo, Junliang Xing, Anton Milan, Xiaoqin Zhang, Wei Liu, and Tae-Kyun Kim. 2021. Multiple object tracking: A literature review. Artificial intelligence 293 (2021), 103448."},{"key":"e_1_3_2_2_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00297"},{"key":"e_1_3_2_2_22_1","volume-title":"Syed Muhammad Aamir, and Waseef Menhaj.","author":"Mirani Imran Khan","year":"2022","unstructured":"Imran Khan Mirani, Chen Tianhua, Malak Abid Ali Khan, Syed Muhammad Aamir, and Waseef Menhaj. 2022. Object Recognition in Different Lighting Conditions at Various Angles by Deep Learning Method. arXiv preprint arXiv:2210.09618 (2022)."},{"key":"e_1_3_2_2_23_1","volume-title":"A survey of top-down approaches for human pose estimation. arXiv preprint arXiv:2202.02656","author":"Nguyen Thong Duy","year":"2022","unstructured":"Thong Duy Nguyen and Milan Kresovic. 2022. A survey of top-down approaches for human pose estimation. arXiv preprint arXiv:2202.02656 (2022)."},{"key":"e_1_3_2_2_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/MRA.2018.2833157"},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/3570731"},{"key":"e_1_3_2_2_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/CCIS.2018.8691393"},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.3390\/s20205789"},{"key":"e_1_3_2_2_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/HUMANOIDS.2015.7363546"},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2012.6225287"},{"key":"e_1_3_2_2_30_1","doi-asserted-by":"publisher","DOI":"10.1108\/IJCHM-07-2020-0739"},{"key":"e_1_3_2_2_31_1","volume-title":"YOLOv7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. arXiv preprint arXiv:2207.02696","author":"Wang Chien-Yao","year":"2022","unstructured":"Chien-Yao Wang, Alexey Bochkovskiy, and Hong-Yuan Mark Liao. 2022. YOLOv7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. arXiv preprint arXiv:2207.02696 (2022)."},{"key":"e_1_3_2_2_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00098"},{"key":"e_1_3_2_2_33_1","volume-title":"Bytetrack: Multi-object tracking by associating every detection box. In Computer Vision--ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23--27","author":"Zhang Yifu","year":"2022","unstructured":"Yifu Zhang, Peize Sun, Yi Jiang, Dongdong Yu, Fucheng Weng, Zehuan Yuan, Ping Luo, Wenyu Liu, and Xinggang Wang. 2022. Bytetrack: Multi-object tracking by associating every detection box. In Computer Vision--ECCV 2022: 17th European Conference, Tel Aviv, Israel, October 23--27, 2022, Proceedings, Part XXII. Springer, 1--21."},{"key":"e_1_3_2_2_34_1","volume-title":"DPIT: Dual-Pipeline Integrated Transformer for Human Pose Estimation. In Artificial Intelligence: Second CAAI International Conference, CICAI 2022","author":"Zhao Shuaitao","year":"2023","unstructured":"Shuaitao Zhao, Kun Liu, Yuhang Huang, Qian Bao, Dan Zeng, and Wu Liu. 2023. DPIT: Dual-Pipeline Integrated Transformer for Human Pose Estimation. In Artificial Intelligence: Second CAAI International Conference, CICAI 2022, Beijing, China, August 27--28, 2022, Revised Selected Papers, Part II. Springer, 559--576."}],"event":{"name":"HRI '24: ACM\/IEEE International Conference on Human-Robot Interaction","sponsor":["SIGAI ACM Special Interest Group on Artificial Intelligence","SIGCHI ACM Special Interest Group on Computer-Human Interaction"],"location":"Boulder CO USA","acronym":"HRI '24"},"container-title":["Companion of the 2024 ACM\/IEEE International Conference on Human-Robot Interaction"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3610978.3640648","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3610978.3640648","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T01:26:45Z","timestamp":1755826005000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3610978.3640648"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,3,11]]},"references-count":34,"alternative-id":["10.1145\/3610978.3640648","10.1145\/3610978"],"URL":"https:\/\/doi.org\/10.1145\/3610978.3640648","relation":{},"subject":[],"published":{"date-parts":[[2024,3,11]]},"assertion":[{"value":"2024-03-11","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}