{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,2]],"date-time":"2025-11-02T17:10:38Z","timestamp":1762103438366,"version":"build-2065373602"},"reference-count":59,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2024,4,15]],"date-time":"2024-04-15T00:00:00Z","timestamp":1713139200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,4,15]],"date-time":"2024-04-15T00:00:00Z","timestamp":1713139200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["No. 62271166"],"award-info":[{"award-number":["No. 62271166"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Interdisciplinary Research Foundation of HIT","award":["No. IR2021104"],"award-info":[{"award-number":["No. IR2021104"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Machine Vision and Applications"],"published-print":{"date-parts":[[2024,5]]},"DOI":"10.1007\/s00138-024-01520-8","type":"journal-article","created":{"date-parts":[[2024,4,15]],"date-time":"2024-04-15T10:02:07Z","timestamp":1713175327000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["PTDS CenterTrack: pedestrian tracking in dense scenes with re-identification and feature enhancement"],"prefix":"10.1007","volume":"35","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-7387-4970","authenticated-orcid":false,"given":"Jiazheng","family":"Wen","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Huanyu","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Junbao","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,4,15]]},"reference":[{"issue":"12","key":"1520_CR1","doi-asserted-by":"publisher","first-page":"9641","DOI":"10.1109\/TPAMI.2021.3124736","volume":"44","author":"B Artacho","year":"2022","unstructured":"Artacho, B., Savakis, A.: Unipose+: a unified framework for 2d and 3d human pose estimation in images and videos. IEEE Trans. Pattern Anal. Mach. Intell. 44(12), 9641\u20139653 (2022). https:\/\/doi.org\/10.1109\/TPAMI.2021.3124736","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1520_CR2","doi-asserted-by":"publisher","unstructured":"Ban, Y., Ba, S., Alameda-Pineda, X., et\u00a0al.: Tracking multiple persons based on a variational bayesian model. In: European Conference on Computer Vision, Springer, pp 52\u201367, https:\/\/doi.org\/10.1007\/978-3-319-48881-3_5 (2016)","DOI":"10.1007\/978-3-319-48881-3_5"},{"key":"1520_CR3","doi-asserted-by":"publisher","unstructured":"Bergmann, P., Meinhardt, T., Leal-Taixe, L.: Tracking without bells and whistles. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 941\u2013951, https:\/\/doi.org\/10.1109\/ICCV.2019.00103 (2019)","DOI":"10.1109\/ICCV.2019.00103"},{"key":"1520_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2008\/246309","volume":"2008","author":"K Bernardin","year":"2008","unstructured":"Bernardin, K., Stiefelhagen, R.: Evaluating multiple object tracking performance: the clear mot metrics. EURASIP J. Image Video Process. 2008, 1\u201310 (2008). https:\/\/doi.org\/10.1155\/2008\/246309","journal-title":"EURASIP J. Image Video Process."},{"key":"1520_CR5","unstructured":"Bertasius, G., Feichtenhofer, C., Tran, D., et\u00a0al.: Learning temporal pose estimation from sparsely-labeled videos. In: Wallach H, Larochelle H, Beygelzimer A, et\u00a0al (eds) Advances in neural information processing systems, vol\u00a032. Curran Associates, Inc., https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2019\/file\/7137debd45ae4d0ab9aa953017286b20-Paper.pdf (2019)"},{"key":"1520_CR6","doi-asserted-by":"publisher","unstructured":"Bewley, A., Ge, Z., Ott, L., et\u00a0al.: Simple online and realtime tracking. In: 2016 IEEE International Conference on Image Processing (ICIP), IEEE, pp 3464\u20133468, https:\/\/doi.org\/10.1109\/ICIP.2016.7533003 (2016)","DOI":"10.1109\/ICIP.2016.7533003"},{"key":"1520_CR7","doi-asserted-by":"publisher","unstructured":"Bras\u00f3, G., Leal-Taix\u00e9, L.: Learning a neural solver for multiple object tracking. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 6247\u20136257, https:\/\/doi.org\/10.1109\/CVPR42600.2020.00628 (2020)","DOI":"10.1109\/CVPR42600.2020.00628"},{"key":"1520_CR8","doi-asserted-by":"crossref","unstructured":"Chen, D., Zhang, S., Ouyang, W., et\u00a0al.: Person search via a mask-guided two-stream CNN Model. pp 734\u2013750, https:\/\/openaccess.thecvf.com\/content_ECCV_2018\/html\/Di_Chen_Person_Search_via_ECCV_2018_paper.html (2018)","DOI":"10.1007\/978-3-030-01234-2_45"},{"key":"1520_CR9","doi-asserted-by":"publisher","unstructured":"Chen, X., Fang, H., Lin, T.Y., et\u00a0al.: Microsoft coco captions: data collection and evaluation server. arXiv:1504.00325https:\/\/doi.org\/10.48550\/arXiv.1504.00325 (2015)","DOI":"10.48550\/arXiv.1504.00325"},{"key":"1520_CR10","doi-asserted-by":"publisher","unstructured":"Ciaparrone, G., Luque S\u00e1nchez, F., Tabik, S., et al.: Deep learning in video multi-object tracking: a survey. Neurocomputing 381, 61\u201388 (2020). https:\/\/doi.org\/10.1016\/j.neucom.2019.11.023","DOI":"10.1016\/j.neucom.2019.11.023"},{"key":"1520_CR11","doi-asserted-by":"publisher","DOI":"10.5555\/3157096.3157139","author":"J Dai","year":"2016","unstructured":"Dai, J., Li, Y., He, K., et al.: R-fcn: object detection via region-based fully convolutional networks. Adv. Neural Inform. Process. Syst. (2016). https:\/\/doi.org\/10.5555\/3157096.3157139","journal-title":"Adv. Neural Inform. Process. Syst."},{"key":"1520_CR12","doi-asserted-by":"publisher","unstructured":"Dai, J., Qi, H., Xiong, Y., et\u00a0al.: Deformable convolutional networks. In: Proceedings of the IEEE International Conference on Computer Vision, pp 764\u2013773, https:\/\/doi.org\/10.1109\/ICCV.2017.89 (2017)","DOI":"10.1109\/ICCV.2017.89"},{"key":"1520_CR13","doi-asserted-by":"publisher","unstructured":"Dave, A., Khurana, T., Tokmakov, P., et\u00a0al.: Tao: a large-scale benchmark for tracking any object. In: European Conference on Computer Vision, Springer, pp 436\u2013454, https:\/\/doi.org\/10.1007\/978-3-030-58558-7_26 (2020)","DOI":"10.1007\/978-3-030-58558-7_26"},{"key":"1520_CR14","doi-asserted-by":"publisher","unstructured":"Dendorfer, P., Rezatofighi, H., Milan, A., et\u00a0al.: Mot20: A benchmark for multi object tracking in crowded scenes. arXiv preprinthttps:\/\/doi.org\/10.48550\/arXiv.2003.09003 (2020)","DOI":"10.48550\/arXiv.2003.09003"},{"key":"1520_CR15","doi-asserted-by":"publisher","unstructured":"Ge, Z., Liu, S., Wang, F., et\u00a0al.: Yolox: Exceeding yolo series in 2021. arXiv preprint arXiv:2107.08430https:\/\/doi.org\/10.48550\/arXiv.2107.08430 (2021)","DOI":"10.48550\/arXiv.2107.08430"},{"issue":"11","key":"1520_CR16","doi-asserted-by":"publisher","first-page":"1231","DOI":"10.1177\/0278364913491297","volume":"32","author":"A Geiger","year":"2013","unstructured":"Geiger, A., Lenz, P., Stiller, C., et al.: Vision meets robotics: the kitti dataset. Int. J. Robot. Res. 32(11), 1231\u20131237 (2013). https:\/\/doi.org\/10.1177\/0278364913491297","journal-title":"Int. J. Robot. Res."},{"key":"1520_CR17","doi-asserted-by":"publisher","unstructured":"Girshick, R.: Fast r-cnn. In: Proceedings of the IEEE International Conference on Computer Vision, pp 1440\u20131448, https:\/\/doi.org\/10.1109\/ICCV.2015.169 (2015)","DOI":"10.1109\/ICCV.2015.169"},{"issue":"4","key":"1520_CR18","doi-asserted-by":"publisher","first-page":"447","DOI":"10.1016\/j.jksuci.2019.09.004","volume":"32","author":"N Jaouedi","year":"2020","unstructured":"Jaouedi, N., Boujnah, N., Bouhlel, M.S.: A new hybrid deep learning model for human action recognition. J. King Saud Univ.-Comput. Inform. Sci. 32(4), 447\u2013453 (2020). https:\/\/doi.org\/10.1016\/j.jksuci.2019.09.004","journal-title":"J. King Saud Univ.-Comput. Inform. Sci."},{"key":"1520_CR19","doi-asserted-by":"publisher","unstructured":"Karthik, S., Prabhu, A., Gandhi, V.: Simple unsupervised multi-object tracking. arXiv preprint arXiv:2006.02609https:\/\/doi.org\/10.48550\/arXiv.2006.02609 (2020)","DOI":"10.48550\/arXiv.2006.02609"},{"key":"1520_CR20","volume-title":"Performance Evaluation Protocol for Face, Person and Vehicle Detection and Tracking in Video Analysis and Content Extraction (vace-ii)","author":"R Kasturi","year":"2006","unstructured":"Kasturi, R., Goldgof, D., Soundararajan, P., et al.: Performance Evaluation Protocol for Face, Person and Vehicle Detection and Tracking in Video Analysis and Content Extraction (vace-ii). Computer Science & Engineering University of South Florida, Tampa (2006)"},{"key":"1520_CR21","doi-asserted-by":"publisher","first-page":"7389","DOI":"10.1109\/TIP.2020.3002345","volume":"29","author":"T Kong","year":"2020","unstructured":"Kong, T., Sun, F., Liu, H., et al.: Foveabox: beyound anchor-based object detection. IEEE Trans. Image Process. 29, 7389\u20137398 (2020). https:\/\/doi.org\/10.1109\/TIP.2020.3002345","journal-title":"IEEE Trans. Image Process."},{"key":"1520_CR22","doi-asserted-by":"publisher","unstructured":"Law, H., Deng, J.: Cornernet: detecting objects as paired keypoints. In: Proceedings of the European Conference on Computer Vision (ECCV), pp 734\u2013750, https:\/\/doi.org\/10.1007\/s11263-019-01204-1 (2018)","DOI":"10.1007\/s11263-019-01204-1"},{"key":"1520_CR23","doi-asserted-by":"publisher","unstructured":"Leal-Taix\u00e9, L., Milan, A., Reid, I., et\u00a0al.: Motchallenge 2015: Towards a benchmark for multi-target tracking. arXiv preprint arXiv:1504.01942https:\/\/doi.org\/10.48550\/arXiv.1504.01942 (2015)","DOI":"10.48550\/arXiv.1504.01942"},{"issue":"3","key":"1520_CR24","doi-asserted-by":"publisher","first-page":"592","DOI":"10.1021\/ci300493w","volume":"53","author":"GB Li","year":"2013","unstructured":"Li, G.B., Yang, L.L., Wang, W.J., et al.: Id-score: a new empirical scoring function based on a comprehensive set of descriptors related to protein-ligand interactions. J. Chem. Inf. Model. 53(3), 592\u2013600 (2013). https:\/\/doi.org\/10.1021\/ci300493w","journal-title":"J. Chem. Inf. Model."},{"issue":"2","key":"1520_CR25","doi-asserted-by":"publisher","first-page":"318","DOI":"10.1109\/TPAMI.2018.2858826","volume":"42","author":"TY Lin","year":"2020","unstructured":"Lin, T.Y., Goyal, P., Girshick, R., et al.: Focal loss for dense object detection. IEEE Trans. Pattern Anal. Mach. Intell. 42(2), 318\u2013327 (2020). https:\/\/doi.org\/10.1109\/TPAMI.2018.2858826","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1520_CR26","doi-asserted-by":"publisher","unstructured":"Liu, W., Anguelov, D., Erhan, D., et\u00a0al.: Ssd: Single shot multibox detector. In: European Conference on Computer Vision, Springer, pp 21\u201337, https:\/\/doi.org\/10.1007\/978-3-319-46448-0_2 (2016)","DOI":"10.1007\/978-3-319-46448-0_2"},{"issue":"2","key":"1520_CR27","doi-asserted-by":"publisher","first-page":"548","DOI":"10.1007\/s11263-020-01375-2","volume":"129","author":"J Luiten","year":"2021","unstructured":"Luiten, J., Osep, A., Dendorfer, P., et al.: Hota: a higher order metric for evaluating multi-object tracking. Int. J. Comput. Vision 129(2), 548\u2013578 (2021). https:\/\/doi.org\/10.1007\/s11263-020-01375-2","journal-title":"Int. J. Comput. Vision"},{"issue":"1","key":"1520_CR28","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1038\/s41467-020-19105-0","volume":"11","author":"T Maekawa","year":"2020","unstructured":"Maekawa, T., Ohara, K., Zhang, Y., et al.: Deep learning-assisted comparative analysis of animal trajectories with deephl. Nat. Commun. 11(1), 1\u201315 (2020). https:\/\/doi.org\/10.1038\/s41467-020-19105-0","journal-title":"Nat. Commun."},{"key":"1520_CR29","doi-asserted-by":"publisher","unstructured":"Milan, A., Leal-Taix\u00e9, L., Reid, I., et\u00a0al.: Mot16: a benchmark for multi-object tracking. arXiv preprint arXiv:1603.00831https:\/\/doi.org\/10.48550\/arXiv.1603.00831 (2016)","DOI":"10.48550\/arXiv.1603.00831"},{"key":"1520_CR30","doi-asserted-by":"publisher","unstructured":"Pang, B., Li, Y., Zhang, Y., et\u00a0al.: Tubetk: Adopting tubes to track multi-object in a one-step training model. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 6308\u20136318, https:\/\/doi.org\/10.1109\/CVPR42600.2020.00634 (2020)","DOI":"10.1109\/CVPR42600.2020.00634"},{"key":"1520_CR31","doi-asserted-by":"publisher","unstructured":"Papakis, I., Sarkar, A., Karpatne, A.: A graph convolutional neural network based approach for traffic monitoring using augmented detections with optical flow. In: 2021 IEEE International Intelligent Transportation Systems Conference (ITSC), IEEE, pp 2980\u20132986, https:\/\/doi.org\/10.48550\/arXiv.2010.00067 (2021)","DOI":"10.48550\/arXiv.2010.00067"},{"key":"1520_CR32","doi-asserted-by":"publisher","unstructured":"Pedersen, M., Haurum, J.B., Dendorfer, P., et\u00a0al.: MOTCOM: the multi-object tracking dataset complexity metric. In: Avidan, S., Brostow, G., Ciss\u00e9, M., et\u00a0al (eds) Computer Vision - ECCV 2022. Springer Nature Switzerland, Cham, Lecture Notes in Computer Science, pp 20\u201337, https:\/\/doi.org\/10.1007\/978-3-031-20074-8_2 (2022)","DOI":"10.1007\/978-3-031-20074-8_2"},{"key":"1520_CR33","doi-asserted-by":"publisher","unstructured":"Peng, J., Wang, C., Wan, F., et\u00a0al.: Chained-tracker: chaining paired attentive regression results for end-to-end joint multiple-object detection and tracking. In: European Conference on Computer Vision, Springer, pp 145\u2013161, https:\/\/doi.org\/10.1007\/978-3-030-58548-8_9 (2020)","DOI":"10.1007\/978-3-030-58548-8_9"},{"key":"1520_CR34","doi-asserted-by":"publisher","unstructured":"Redmon, J., Farhadi, A.: Yolov3: An incremental improvement. arXiv preprint arXiv:1804.02767https:\/\/doi.org\/10.48550\/arXiv.1804.02767 (2018)","DOI":"10.48550\/arXiv.1804.02767"},{"issue":"6","key":"1520_CR35","doi-asserted-by":"publisher","first-page":"843","DOI":"10.1109\/TAC.1979.1102177","volume":"24","author":"D Reid","year":"1979","unstructured":"Reid, D.: An algorithm for tracking multiple targets. IEEE Trans. Autom. Control 24(6), 843\u2013854 (1979). https:\/\/doi.org\/10.1109\/TAC.1979.1102177","journal-title":"IEEE Trans. Autom. Control"},{"key":"1520_CR36","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2577031","author":"S Ren","year":"2015","unstructured":"Ren, S., He, K., Girshick, R., et al.: Faster r-cnn: towards real-time object detection with region proposal networks. Adv. Neural Inform. Process. Syst. (2015). https:\/\/doi.org\/10.1109\/TPAMI.2016.2577031","journal-title":"Adv. Neural Inform. Process. Syst."},{"key":"1520_CR37","doi-asserted-by":"publisher","first-page":"1439","DOI":"10.1109\/TIP.2020.3044219","volume":"30","author":"W Ren","year":"2020","unstructured":"Ren, W., Wang, X., Tian, J., et al.: Tracking-by-counting: using network flows on crowd density maps for tracking multiple targets. IEEE Trans. Image Process. 30, 1439\u20131452 (2020). https:\/\/doi.org\/10.1109\/TIP.2020.3044219","journal-title":"IEEE Trans. Image Process."},{"key":"1520_CR38","doi-asserted-by":"publisher","unstructured":"Schulter, S., Vernaza, P., Choi, W., et\u00a0al.: Deep network flow for multi-object tracking. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 6951\u20136960, https:\/\/doi.org\/10.1109\/CVPR.2017.292 (2017)","DOI":"10.1109\/CVPR.2017.292"},{"key":"1520_CR39","doi-asserted-by":"publisher","unstructured":"Shao, S., Zhao, Z., Li, B., et\u00a0al.: Crowdhuman: A benchmark for detecting human in a crowd. arXiv preprint arXiv:1805.00123https:\/\/doi.org\/10.48550\/arXiv.1805.00123 (2018)","DOI":"10.48550\/arXiv.1805.00123"},{"key":"1520_CR40","doi-asserted-by":"publisher","unstructured":"Sun, P., Cao, J., Jiang, Y., et\u00a0al.: Transtrack: Multiple object tracking with transformer. arXiv preprint arXiv:2012.15460https:\/\/doi.org\/10.48550\/arXiv.2012.15460 (2020)","DOI":"10.48550\/arXiv.2012.15460"},{"key":"1520_CR41","doi-asserted-by":"publisher","unstructured":"Tian, Z., Shen, C., Chen, H., et\u00a0al.: Fcos: Fully convolutional one-stage object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 9627\u20139636, https:\/\/doi.org\/10.1109\/CVPR.2019.00094 (2019)","DOI":"10.1109\/CVPR.2019.00094"},{"key":"1520_CR42","doi-asserted-by":"publisher","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., et\u00a0al.: Attention is all you need. Advances in neural information processing systems 30. https:\/\/doi.org\/10.48550\/arXiv.1706.03762 (2017)","DOI":"10.48550\/arXiv.1706.03762"},{"key":"1520_CR43","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2022.3140919","author":"G Wang","year":"2022","unstructured":"Wang, G., Wang, Y., Gu, R., et al.: Split and connect: a universal tracklet booster for multi-object tracking. IEEE Trans. Multimedia (2022). https:\/\/doi.org\/10.1109\/TMM.2022.3140919","journal-title":"IEEE Trans. Multimedia"},{"key":"1520_CR44","doi-asserted-by":"publisher","unstructured":"Wang, Q., Zheng, Y., Pan, P., et\u00a0al.: Multiple object tracking with correlation learning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 3876\u20133886, https:\/\/doi.org\/10.1109\/CVPR46437.2021.00387 (2021a)","DOI":"10.1109\/CVPR46437.2021.00387"},{"key":"1520_CR45","doi-asserted-by":"publisher","unstructured":"Wang, Y., Kitani, K., Weng, X.: Joint object detection and multi-object tracking with graph neural networks. In: 2021 IEEE International Conference on Robotics and Automation (ICRA). IEEE Press, p 13708-13715, https:\/\/doi.org\/10.1109\/ICRA48506.2021.9561110, (2021b)","DOI":"10.1109\/ICRA48506.2021.9561110"},{"key":"1520_CR46","doi-asserted-by":"publisher","unstructured":"Wang, Z., Zheng, L., Liu, Y., et\u00a0al.: Towards real-time multi-object tracking. In: European Conference on Computer Vision, Springer, pp 107\u2013122, https:\/\/doi.org\/10.1007\/978-3-030-58621-8_7 (2020)","DOI":"10.1007\/978-3-030-58621-8_7"},{"key":"1520_CR47","doi-asserted-by":"publisher","unstructured":"Wojke, N., Bewley, A., Paulus, D.: Simple online and realtime tracking with a deep association metric. In: 2017 IEEE International Conference on Image Processing (ICIP), IEEE, pp 3645\u20133649, https:\/\/doi.org\/10.1109\/icip.2017.8296962 (2017)","DOI":"10.1109\/icip.2017.8296962"},{"key":"1520_CR48","doi-asserted-by":"publisher","unstructured":"Wu, J., Cao, J., Song, L., et\u00a0al.: Track to detect and segment: An online multi-object tracker. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), pp 12352\u201312361, https:\/\/doi.org\/10.48550\/arXiv.2103.08808 (2021)","DOI":"10.48550\/arXiv.2103.08808"},{"key":"1520_CR49","doi-asserted-by":"publisher","unstructured":"Xu, Y., Ban, Y., Delorme, G., et\u00a0al.: Transcenter: Transformers with dense representations for multiple-object tracking. IEEE Transactions on Pattern Analysis and Machine Intelligence pp 1\u201316. https:\/\/doi.org\/10.1109\/TPAMI.2022.3225078 (2022)","DOI":"10.1109\/TPAMI.2022.3225078"},{"issue":"6","key":"1520_CR50","doi-asserted-by":"publisher","first-page":"7820","DOI":"10.1109\/TPAMI.2022.3225078","volume":"45","author":"Y Xu","year":"2023","unstructured":"Xu, Y., Ban, Y., Delorme, G., et al.: Transcenter: transformers with dense representations for multiple-object tracking. IEEE Trans. Pattern Anal. Mach. Intell. 45(6), 7820\u20137835 (2023). https:\/\/doi.org\/10.1109\/TPAMI.2022.3225078","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"1520_CR51","doi-asserted-by":"publisher","unstructured":"Zhang, H., Chang, H., Ma, B., et\u00a0al.: Cascade retinanet: Maintaining consistency for single-stage object detection. British Machine Vision Conference https:\/\/doi.org\/10.48550\/arXiv.1907.06881, https:\/\/api.semanticscholar.org\/CorpusID:196831468 (2019)","DOI":"10.48550\/arXiv.1907.06881"},{"key":"1520_CR52","doi-asserted-by":"publisher","unstructured":"Zhang, L., Li, Y., Nevatia, R.: Global data association for multi-object tracking using network flows. In: 2008 IEEE Conference on Computer Vision and Pattern Recognition, IEEE, pp 1\u20138, https:\/\/doi.org\/10.1109\/CVPR.2008.4587584 (2008)","DOI":"10.1109\/CVPR.2008.4587584"},{"issue":"9","key":"1520_CR53","doi-asserted-by":"publisher","first-page":"7892","DOI":"10.1109\/JIOT.2020.2996609","volume":"7","author":"Y Zhang","year":"2020","unstructured":"Zhang, Y., Sheng, H., Wu, Y., et al.: Multiplex labeling graph for near-online tracking in crowded scenes. IEEE Internet Things J. 7(9), 7892\u20137902 (2020). https:\/\/doi.org\/10.1109\/JIOT.2020.2996609","journal-title":"IEEE Internet Things J."},{"issue":"11","key":"1520_CR54","doi-asserted-by":"publisher","first-page":"3069","DOI":"10.1007\/S11263-021-01513-4","volume":"129","author":"Y Zhang","year":"2021","unstructured":"Zhang, Y., Wang, C., Wang, X., et al.: Fairmot: on the fairness of detection and re-identification in multiple object tracking. Int. J. Comput. Vision 129(11), 3069\u20133087 (2021). https:\/\/doi.org\/10.1007\/S11263-021-01513-4","journal-title":"Int. J. Comput. Vision"},{"key":"1520_CR55","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Sun, P., Jiang, Y., et al.: Bytetrack: Multi-object tracking by associating every detection box. In: Avidan, S., Brostow, G., Ciss\u00e9, M., et al. (eds.) Computer Vision - ECCV 2022, pp. 1\u201321. Springer Nature Switzerland, Cham (2022)","DOI":"10.1007\/978-3-031-20047-2_1"},{"key":"1520_CR56","doi-asserted-by":"publisher","unstructured":"Zhang, Z., Cheng, D., Zhu, X., et\u00a0al.: Integrated object detection and tracking with tracklet-conditioned detection. arXiv preprint arXiv:1811.11167https:\/\/doi.org\/10.48550\/arXiv.1811.11167 (2018)","DOI":"10.48550\/arXiv.1811.11167"},{"key":"1520_CR57","doi-asserted-by":"publisher","unstructured":"Zhou, X., Wang, D., Kr\u00e4henb\u00fchl, P.: Objects as points. arXiv preprint arXiv:1904.07850https:\/\/doi.org\/10.48550\/arxiv.1904.07850 (2019a)","DOI":"10.48550\/arxiv.1904.07850"},{"key":"1520_CR58","doi-asserted-by":"publisher","unstructured":"Zhou, X., Zhuo, J., Krahenbuhl, P.: Bottom-up object detection by grouping extreme and center points. In: Proceedings of the IEEE\/CVF conference on Computer Vision and Pattern Recognition, pp 850\u2013859, https:\/\/doi.org\/10.1109\/CVPR.2019.00094 (2019b)","DOI":"10.1109\/CVPR.2019.00094"},{"key":"1520_CR59","doi-asserted-by":"publisher","unstructured":"Zhou, X., Koltun, V., Kr\u00e4henb\u00fchl, P.: Tracking objects as points. In: European Conference on Computer Vision, Springer, pp 474\u2013490, https:\/\/doi.org\/10.1007\/978-3-030-58548-8_28 (2020)","DOI":"10.1007\/978-3-030-58548-8_28"}],"container-title":["Machine Vision and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00138-024-01520-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00138-024-01520-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00138-024-01520-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,5,14]],"date-time":"2024-05-14T04:22:53Z","timestamp":1715660573000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00138-024-01520-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,15]]},"references-count":59,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2024,5]]}},"alternative-id":["1520"],"URL":"https:\/\/doi.org\/10.1007\/s00138-024-01520-8","relation":{},"ISSN":["0932-8092","1432-1769"],"issn-type":[{"type":"print","value":"0932-8092"},{"type":"electronic","value":"1432-1769"}],"subject":[],"published":{"date-parts":[[2024,4,15]]},"assertion":[{"value":"26 March 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"23 December 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 February 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 April 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"None","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"54"}}