{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,24]],"date-time":"2025-08-24T00:01:31Z","timestamp":1755993691274,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":52,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,7,24]],"date-time":"2024-07-24T00:00:00Z","timestamp":1721779200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,7,24]]},"DOI":"10.1145\/3671016.3671392","type":"proceedings-article","created":{"date-parts":[[2024,7,17]],"date-time":"2024-07-17T20:19:32Z","timestamp":1721247572000},"page":"437-446","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Reduce Detection Latency of YOLOv5 to Prevent Real-Time Tracking Failures for Lightweight Robots"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6115-6506","authenticated-orcid":false,"given":"Jianxin","family":"Xue","sequence":"first","affiliation":[{"name":"School of Computer and Information Engineering, Shanghai Polytechnic University, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-1383-0036","authenticated-orcid":false,"given":"Husheng","family":"Chen","sequence":"additional","affiliation":[{"name":"School of Computer and Information Engineering, Shanghai Polytechnic University, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-0633-6811","authenticated-orcid":false,"given":"Yaohua","family":"Hu","sequence":"additional","affiliation":[{"name":"School of Computer and Information Engineering, Shanghai Polytechnic University, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-3406-7520","authenticated-orcid":false,"given":"Minyu","family":"Chen","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-8259-2200","authenticated-orcid":false,"given":"Ling-I","family":"Wu","sequence":"additional","affiliation":[{"name":"Shanghai Jiao Tong University, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9212-9810","authenticated-orcid":false,"given":"Xi","family":"Chang","sequence":"additional","affiliation":[{"name":"School of Computer and Information Engineering, Shanghai Polytechnic University, China"}]}],"member":"320","published-online":{"date-parts":[[2024,7,24]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICACCS48705.2020.9074315"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/TENCON.2017.8228388"},{"key":"e_1_3_2_1_3_1","first-page":"3782","article-title":"AP-loss for accurate one-stage object detection","volume":"43","author":"Wang Ji","year":"2020","unstructured":"Kean Chen, Weiyao Lin, Jianguo Li, John See, Ji Wang, and Junni Zou. 2020. AP-loss for accurate one-stage object detection. IEEE Transactions on Pattern Analysis and Machine Intelligence 43, 11 (2020), 3782\u20133798.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"e_1_3_2_1_4_1","volume-title":"PP-LCNet: A lightweight CPU convolutional neural network. arXiv preprint arXiv:2109.15099","author":"Cui Cheng","year":"2021","unstructured":"Cheng Cui, Tingquan Gao, Shengyu Wei, Yuning Du, Ruoyu Guo, Shuilong Dong, Bin Lu, Ying Zhou, Xueying Lv, Qiwen Liu, 2021. PP-LCNet: A lightweight CPU convolutional neural network. arXiv preprint arXiv:2109.15099 (2021)."},{"key":"e_1_3_2_1_5_1","volume-title":"PP-LCNet: A lightweight CPU convolutional neural network. arXiv preprint arXiv:2109.15099","author":"Cui Cheng","year":"2021","unstructured":"Cheng Cui, Tingquan Gao, Shengyu Wei, Yuning Du, Ruoyu Guo, Shuilong Dong, Bin Lu, Ying Zhou, Xueying Lv, Qiwen Liu, 2021. PP-LCNet: A lightweight CPU convolutional neural network. arXiv preprint arXiv:2109.15099 (2021)."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00729"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.3390\/electronics11203263"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"crossref","unstructured":"Markus Eisenbach Alexander Vorndran Sven Sorge and Horst-Michael Gross. 2015. User recognition for guiding and following people with a mobile robot in a clinical environment. (2015) 3600\u20133607.","DOI":"10.1109\/IROS.2015.7353880"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.3390\/s130911603"},{"key":"e_1_3_2_1_10_1","volume-title":"Dssd: Deconvolutional single shot detector. arXiv preprint arXiv:1701.06659","author":"Fu Cheng-Yang","year":"2017","unstructured":"Cheng-Yang Fu, Wei Liu, Ananth Ranga, Ambrish Tyagi, and Alexander\u00a0C Berg. 2017. Dssd: Deconvolutional single shot detector. arXiv preprint arXiv:1701.06659 (2017)."},{"key":"e_1_3_2_1_11_1","volume-title":"Survey of pedestrian detection for advanced driver assistance systems","author":"Geronimo David","year":"2009","unstructured":"David Geronimo, Antonio\u00a0M Lopez, Angel\u00a0D Sappa, and Thorsten Graf. 2009. Survey of pedestrian detection for advanced driver assistance systems. IEEE transactions on pattern analysis and machine intelligence 32, 7 (2009), 1239\u20131258."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00720"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.169"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.3390\/s23177596"},{"key":"e_1_3_2_1_17_1","volume-title":"An end-to-end 3d convolutional neural network for action detection and segmentation in videos. arXiv preprint arXiv:1712.01111","author":"Hou Rui","year":"2017","unstructured":"Rui Hou, Chen Chen, and Mubarak Shah. 2017. An end-to-end 3d convolutional neural network for action detection and segmentation in videos. arXiv preprint arXiv:1712.01111 (2017)."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00140"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01509"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1177\/0278364919881683"},{"key":"e_1_3_2_1_21_1","volume-title":"3D convolutional neural networks for human action recognition","author":"Ji Shuiwang","year":"2012","unstructured":"Shuiwang Ji, Wei Xu, Ming Yang, and Kai Yu. 2012. 3D convolutional neural networks for human action recognition. IEEE transactions on pattern analysis and machine intelligence 35, 1 (2012), 221\u2013231."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00656"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.113"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3053956"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2023.106217"},{"key":"e_1_3_2_1_27_1","volume-title":"Proceedings, Part I 14","author":"Liu Wei","year":"2016","unstructured":"Wei Liu, Dragomir Anguelov, Dumitru Erhan, Christian Szegedy, Scott Reed, Cheng-Yang Fu, and Alexander\u00a0C Berg. 2016. Ssd: Single shot multibox detector. In Computer Vision\u2013ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14. Springer, 21\u201337."},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.3390\/s19163542"},{"key":"e_1_3_2_1_29_1","volume-title":"Real-time human detection in thermal infrared imaging at night using enhanced Tiny-yolov3 network. Journal of Real-Time Image Processing","author":"Manssor AF","year":"2022","unstructured":"Samah\u00a0AF Manssor, Shaoyuan Sun, Mohammed Abdalmajed, and Shima Ali. 2022. Real-time human detection in thermal infrared imaging at night using enhanced Tiny-yolov3 network. Journal of Real-Time Image Processing (2022), 1\u201314."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/3266157.3266221"},{"key":"e_1_3_2_1_31_1","first-page":"15534","article-title":"A ranking-based, balanced loss function unifying classification and localisation in object detection","volume":"33","author":"Oksuz Kemal","year":"2020","unstructured":"Kemal Oksuz, Baris\u00a0Can Cam, Emre Akbas, and Sinan Kalkan. 2020. A ranking-based, balanced loss function unifying classification and localisation in object detection. Advances in Neural Information Processing Systems 33 (2020), 15534\u201315545.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01008"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.91"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.690"},{"key":"e_1_3_2_1_35_1","volume-title":"Yolov3: An incremental improvement. arXiv preprint arXiv:1804.02767","author":"Redmon Joseph","year":"2018","unstructured":"Joseph Redmon and Ali Farhadi. 2018. Yolov3: An incremental improvement. arXiv preprint arXiv:1804.02767 (2018)."},{"volume-title":"Object detection from video using temporal convolutional network. In 2018 IEEE Recent Advances in Intelligent Computational Systems (RAICS)","author":"Sabu Lizabeth","key":"e_1_3_2_1_36_1","unstructured":"ELizabeth Sabu and K Suresh. 2018. Object detection from video using temporal convolutional network. In 2018 IEEE Recent Advances in Intelligent Computational Systems (RAICS). IEEE, 11\u201315."},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i2.25320"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"crossref","unstructured":"Ryosuke Tasaki Michiteru Kitazaki Jun Miura and Kazuhiko Terashima. 2015. Prototype design of medical round supporting robot \u201cTerapio\u201d. (2015) 829\u2013834.","DOI":"10.1109\/ICRA.2015.7139274"},{"key":"e_1_3_2_1_41_1","first-page":"34899","article-title":"Fully convolutional one-stage 3d object detection on lidar range images","volume":"35","author":"Tian Zhi","year":"2022","unstructured":"Zhi Tian, Xiangxiang Chu, Xiaoming Wang, Xiaolin Wei, and Chunhua Shen. 2022. Fully convolutional one-stage 3d object detection on lidar range images. Advances in Neural Information Processing Systems 35 (2022), 34899\u201334911.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00972"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00721"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01559"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.displa.2023.102403"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW54120.2021.00107"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0259283"},{"key":"e_1_3_2_1_48_1","volume-title":"International Conference on Machine Learning. PMLR, 10524\u201310533","author":"Xiong Ruibin","year":"2020","unstructured":"Ruibin Xiong, Yunchang Yang, Di He, Kai Zheng, Shuxin Zheng, Chen Xing, Huishuai Zhang, Yanyan Lan, Liwei Wang, and Tieyan Liu. 2020. On layer normalization in the transformer architecture. In International Conference on Machine Learning. PMLR, 10524\u201310533."},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.3390\/app122312312"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3044564"},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00716"},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6999"}],"event":{"name":"Internetware 2024: 15th Asia-Pacific Symposium on Internetware","sponsor":["SIGSOFT ACM Special Interest Group on Software Engineering"],"location":"Macau China","acronym":"Internetware 2024"},"container-title":["Proceedings of the 15th Asia-Pacific Symposium on Internetware"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3671016.3671392","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3671016.3671392","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T00:37:58Z","timestamp":1755909478000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3671016.3671392"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7,24]]},"references-count":52,"alternative-id":["10.1145\/3671016.3671392","10.1145\/3671016"],"URL":"https:\/\/doi.org\/10.1145\/3671016.3671392","relation":{},"subject":[],"published":{"date-parts":[[2024,7,24]]},"assertion":[{"value":"2024-07-24","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}