{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T05:15:25Z","timestamp":1755839725455,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":36,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,5,30]],"date-time":"2024-05-30T00:00:00Z","timestamp":1717027200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Zhejiang Lab.","award":["2019KD0AD011005"],"award-info":[{"award-number":["2019KD0AD011005"]}]},{"name":"National Key Research and Development Project of China","award":["2020AAA0104001"],"award-info":[{"award-number":["2020AAA0104001"]}]},{"name":"Zhejiang Provincial Science and Technology Planning Key Project of China","award":["2021C03129"],"award-info":[{"award-number":["2021C03129"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,5,30]]},"DOI":"10.1145\/3652583.3658025","type":"proceedings-article","created":{"date-parts":[[2024,6,7]],"date-time":"2024-06-07T06:30:40Z","timestamp":1717741840000},"page":"925-933","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["BFIDet: A YOLOv7-improved Vehicle and Pedestrian Detector via Balancing Feature Integration"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3710-2345","authenticated-orcid":false,"given":"Anrui","family":"Wang","sequence":"first","affiliation":[{"name":"Zhejiang University of Technology, Hangzhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2496-6291","authenticated-orcid":false,"given":"Libo","family":"Weng","sequence":"additional","affiliation":[{"name":"Zhejiang University of Technology, Hangzhou, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4678-1936","authenticated-orcid":false,"given":"Fei","family":"Gao","sequence":"additional","affiliation":[{"name":"Zhejiang University of Technology, Hangzhou, China"}]}],"member":"320","published-online":{"date-parts":[[2024,6,7]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2021.108102"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2022.119108"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2022.104914"},{"key":"e_1_3_2_1_4_1","volume-title":"Yolox: Exceeding yolo series","author":"Ge Zheng","year":"2021","unstructured":"Zheng Ge, Songtao Liu, Feng Wang, Zeming Li, and Jian Sun. Yolox: Exceeding yolo series in 2021. arXiv preprint arXiv:2107.08430, 2021."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1177\/0278364913491297"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"e_1_3_2_1_7_1","volume-title":"Soda10m: a largescale 2d self\/semi-supervised object detection dataset for autonomous driving. arXiv preprint arXiv:2106.11118","author":"Han Jianhua","year":"2021","unstructured":"Jianhua Han, Xiwen Liang, Hang Xu, Kai Chen, Lanqing Hong, Jiageng Mao, Chaoqiang Ye, Wei Zhang, Zhenguo Li, Xiaodan Liang, et al. Soda10m: a largescale 2d self\/semi-supervised object detection dataset for autonomous driving. arXiv preprint arXiv:2106.11118, 2021."},{"key":"e_1_3_2_1_8_1","volume-title":"Ratio-and-scale-aware yolo for pedestrian detection","author":"Hsu Wei-Yen","year":"2020","unstructured":"Wei-Yen Hsu and Wen-Yen Lin. Ratio-and-scale-aware yolo for pedestrian detection. IEEE transactions on image processing, 30:934--947, 2020."},{"key":"e_1_3_2_1_9_1","volume-title":"Accessed: 5th","author":"Jocher G.","year":"2024","unstructured":"G. Jocher, A. Chaurasia, J. Qiu, and et al. Ultralytics YOLO(2023). https:\/\/github.com\/ultralytics\/ultralytics. Accessed: 5th Jan, 2024."},{"key":"e_1_3_2_1_10_1","volume-title":"Accessed: 14th","author":"Jocher G.","year":"2023","unstructured":"G. Jocher, A. Chaurasia, A. Stoken, and et al. ultralytics\/yolov5(2020). https:\/\/github.com\/ultralytics\/yolov5. Accessed: 14th Dec, 2023."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.121209"},{"key":"e_1_3_2_1_12_1","volume-title":"Yolov6: A single-stage object detection framework for industrial applications. arXiv preprint arXiv:2209.02976","author":"Li Chuyi","year":"2022","unstructured":"Chuyi Li, Lulu Li, Hongliang Jiang, Kaiheng Weng, Yifei Geng, Liang Li, Zaidan Ke, Qingyuan Li, Meng Cheng, Weiqiang Nie, et al. Yolov6: A single-stage object detection framework for industrial applications. arXiv preprint arXiv:2209.02976, 2022."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1080\/09540091.2023.2166903"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109878"},{"key":"e_1_3_2_1_16_1","first-page":"1","volume-title":"Applied Intelligence","author":"Liu Mingsheng","year":"2023","unstructured":"Mingsheng Liu, Liang Wan, Bo Wang, and Tingting Wang. Se-yolov4: shuffle expansion yolov4 for pedestrian detection based on pixelshuffle. Applied Intelligence, pages 1--18, 2023."},{"key":"e_1_3_2_1_17_1","first-page":"21","volume-title":"Proceedings, Part I 14","author":"Liu Wei","year":"2016","unstructured":"Wei Liu, Dragomir Anguelov, Dumitru Erhan, Christian Szegedy, Scott Reed, Cheng-Yang Fu, and Alexander C Berg. Ssd: Single shot multibox detector. In Computer Vision--ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11--14, 2016, Proceedings, Part I 14, pages 21--37. Springer, 2016."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN54540.2023.10191242"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/WACV48630.2021.00318"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2022.105705"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.3390\/electronics11142162"},{"key":"e_1_3_2_1_22_1","volume-title":"Yolov3: An incremental improvement. arXiv preprint arXiv:1804.02767","author":"Redmon Joseph","year":"2018","unstructured":"Joseph Redmon and Ali Farhadi. Yolov3: An incremental improvement. arXiv preprint arXiv:1804.02767, 2018."},{"key":"e_1_3_2_1_23_1","volume-title":"Faster r-cnn: Towards real-time object detection with region proposal networks. Advances in neural information processing systems, 28","author":"Ren Shaoqing","year":"2015","unstructured":"Shaoqing Ren, Kaiming He, Ross Girshick, and Jian Sun. Faster r-cnn: Towards real-time object detection with region proposal networks. Advances in neural information processing systems, 28, 2015."},{"key":"e_1_3_2_1_24_1","first-page":"1","volume-title":"Multimedia Tools and Applications","author":"Singh Navjot","year":"2023","unstructured":"Navjot Singh, Paras Saini, Om Shubham, Rituraj Awasthi, Anurag Bharti, and Neetesh Kumar. Improved yolov5l for vehicle detection: an application to estimating traffic density and identifying over speeding vehicles on highway scenes. Multimedia Tools and Applications, pages 1--31, 2023."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1080\/09540091.2023.2168254"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v31i1.11231"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/3488933.3489039"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2020.3041278"},{"key":"e_1_3_2_1_29_1","first-page":"7464","volume-title":"Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition","author":"Bochkovskiy Alexey","year":"2023","unstructured":"Chien-YaoWang, Alexey Bochkovskiy, and Hong-Yuan Mark Liao. Yolov7: Trainable bag-of-freebies sets new state-of-the-art for real-time object detectors. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pages 7464--7475, 2023."},{"key":"e_1_3_2_1_30_1","first-page":"11534","volume-title":"Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition","author":"Zhu Pengfei","year":"2020","unstructured":"QilongWang, BangguWu, Pengfei Zhu, Peihua Li,Wangmeng Zuo, and Qinghua Hu. Eca-net: Efficient channel attention for deep convolutional neural networks. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pages 11534--11542, 2020."},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10489-021-03061-3"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/BIBM49941.2020.9313473"},{"key":"e_1_3_2_1_33_1","first-page":"1","volume-title":"The Visual Computer","author":"Yang Tiejun","year":"2021","unstructured":"Tiejun Yang, Ruiqiang Liang, and Lin Huang. Vehicle counting method based on attention mechanism ssd and state detection. The Visual Computer, pages 1--11, 2021."},{"key":"e_1_3_2_1_34_1","first-page":"18","volume-title":"International Conference on Algorithms and Architectures for Parallel Processing","author":"Zhang JIN","year":"2021","unstructured":"JIN Zhang, Meng Luo, Cheng Sun, and Peiqi Qu. Bfr-retinanet: An improved retinanet model for vehicle detection in aerial images. In International Conference on Algorithms and Architectures for Parallel Processing, pages 18--32. Springer, 2021."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1049\/ipr2.12297"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW54120.2021.00312"}],"event":{"name":"ICMR '24: International Conference on Multimedia Retrieval","sponsor":["SIGMM ACM Special Interest Group on Multimedia","SIGSOFT ACM Special Interest Group on Software Engineering"],"location":"Phuket Thailand","acronym":"ICMR '24"},"container-title":["Proceedings of the 2024 International Conference on Multimedia Retrieval"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3652583.3658025","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3652583.3658025","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T08:48:38Z","timestamp":1755766118000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3652583.3658025"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,30]]},"references-count":36,"alternative-id":["10.1145\/3652583.3658025","10.1145\/3652583"],"URL":"https:\/\/doi.org\/10.1145\/3652583.3658025","relation":{},"subject":[],"published":{"date-parts":[[2024,5,30]]},"assertion":[{"value":"2024-06-07","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}