{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T17:51:18Z","timestamp":1740160278576,"version":"3.37.3"},"reference-count":85,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2024,5,2]],"date-time":"2024-05-02T00:00:00Z","timestamp":1714608000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,5,2]],"date-time":"2024-05-02T00:00:00Z","timestamp":1714608000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["62371208","62371208","62371208","62371208"],"award-info":[{"award-number":["62371208","62371208","62371208","62371208"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100002858","name":"China Postdoctoral Science Foundation","doi-asserted-by":"publisher","award":["2015M581720","2015M581720","2015M581720","2015M581720"],"award-info":[{"award-number":["2015M581720","2015M581720","2015M581720","2015M581720"]}],"id":[{"id":"10.13039\/501100002858","id-type":"DOI","asserted-by":"publisher"}]},{"name":"111 Projects","award":["B12018","B12018","B12018","B12018"],"award-info":[{"award-number":["B12018","B12018","B12018","B12018"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int. J. Mach. Learn. &amp; Cyber."],"published-print":{"date-parts":[[2025,1]]},"DOI":"10.1007\/s13042-024-02182-8","type":"journal-article","created":{"date-parts":[[2024,5,2]],"date-time":"2024-05-02T08:01:49Z","timestamp":1714636909000},"page":"143-158","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Igtracker: task and instance information gaps in multiple object tracking"],"prefix":"10.1007","volume":"16","author":[{"given":"Jialin","family":"Liu","sequence":"first","affiliation":[]},{"given":"Jun","family":"Kong","sequence":"additional","affiliation":[]},{"given":"Min","family":"Jiang","sequence":"additional","affiliation":[]},{"given":"Danfeng","family":"Zhuang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,5,2]]},"reference":[{"key":"2182_CR1","doi-asserted-by":"publisher","first-page":"3053","DOI":"10.1007\/s13042-020-01220-5","volume":"12","author":"I Ahmed","year":"2021","unstructured":"Ahmed I, Ahmad M, Ahmad A, Jeon G (2021) Top view multiple people tracking by detection using deep sort and yolov3 with transfer learning: within 5g infrastructure. Int J Mach Learn Cybern 12:3053\u20133067","journal-title":"Int J Mach Learn Cybern"},{"key":"2182_CR2","doi-asserted-by":"crossref","unstructured":"Oh S, Hoogs A, Perera A, Cuntoor N, Chen C-C, Lee JT, Mukherjee S, Aggarwal J, Lee H, Davis L (2011) A large-scale benchmark dataset for event recognition in surveillance video. In: CVPR 2011, pp. 3153\u20133160. IEEE","DOI":"10.1109\/CVPR.2011.5995586"},{"issue":"1","key":"2182_CR3","doi-asserted-by":"publisher","DOI":"10.1016\/j.ipm.2021.102736","volume":"59","author":"C Shao","year":"2022","unstructured":"Shao C, Yang Y, Juneja SG, Seetharam T (2022) Iot data visualization for business intelligence in corporate finance. Inf Process Manag 59(1):102736","journal-title":"Inf Process Manag"},{"issue":"1","key":"2182_CR4","first-page":"241","volume":"70","author":"Z Liu","year":"2022","unstructured":"Liu Z, Zhang O, Gao Y, Zhao Y, Sun Y, Liu J (2022) Adaptive neural network-based fixed-time control for trajectory tracking of robotic systems. IEEE Trans Circ Syst II Express Briefs 70(1):241\u2013245","journal-title":"IEEE Trans Circ Syst II Express Briefs"},{"key":"2182_CR5","doi-asserted-by":"publisher","DOI":"10.1016\/j.rcim.2022.102476","volume":"80","author":"S Tan","year":"2023","unstructured":"Tan S, Yang J, Ding H (2023) A prediction and compensation method of robot tracking error considering pose-dependent load decomposition. Robot Comput-Integr Manuf 80:102476","journal-title":"Robot Comput-Integr Manuf"},{"key":"2182_CR6","doi-asserted-by":"crossref","unstructured":"Janai J, G\u00fcney F, Behl A, Geiger A (2020) Computer vision for autonomous vehicles: problems, datasets and state of the art. Found Trends\u00ae Comput Graph Vis 12(1\u20133):1\u2013308","DOI":"10.1561\/0600000079"},{"key":"2182_CR7","doi-asserted-by":"crossref","unstructured":"Sun P, Kretzschmar H, Dotiwalla X, Chouard A, Patnaik V, Tsui P, Guo J, Zhou Y, Chai Y, Caine B (2020) Scalability in perception for autonomous driving: Waymo open dataset. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2446\u20132454","DOI":"10.1109\/CVPR42600.2020.00252"},{"key":"2182_CR8","doi-asserted-by":"crossref","unstructured":"Yu F, Chen H, Wang X, Xian W, Chen Y, Liu F, Madhavan V, Darrell T (2020) Bdd100k: A diverse driving dataset for heterogeneous multitask learning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 2636\u20132645","DOI":"10.1109\/CVPR42600.2020.00271"},{"key":"2182_CR9","unstructured":"Leal-Taix\u00e9 L, Milan A, Reid I, Roth S, Schindler K (2015) Motchallenge 2015: Towards a benchmark for multi-target tracking"},{"key":"2182_CR10","unstructured":"Milan A, Leal-Taix\u00e9 L, Reid I, Roth S, Schindler K (2016) MOT16: A benchmark for multi-object tracking"},{"key":"2182_CR11","unstructured":"Dendorfer P, Rezatofighi H, Milan A, Shi J, Cremers D, Reid I, Roth S, Schindler K, Leal-Taix\u00e9 L (2020) Mot20: A benchmark for multi object tracking in crowded scenes"},{"key":"2182_CR12","doi-asserted-by":"crossref","unstructured":"Bewley A, Ge Z, Ott L, Ramos F, Upcroft B (2016) Simple online and realtime tracking. In: 2016 IEEE International Conference on Image Processing (ICIP), pp. 3464\u20133468. IEEE","DOI":"10.1109\/ICIP.2016.7533003"},{"key":"2182_CR13","doi-asserted-by":"crossref","unstructured":"Wojke N, Bewley A, Paulus D (2017) Simple online and realtime tracking with a deep association metric. In: 2017 IEEE International Conference on Image Processing (ICIP), pp. 3645\u20133649. IEEE","DOI":"10.1109\/ICIP.2017.8296962"},{"key":"2182_CR14","doi-asserted-by":"crossref","unstructured":"Yu F, Li W, Li Q, Liu Y, Shi X, Yan J (2016) Poi: Multiple object tracking with high performance detection and appearance feature. In: Computer Vision\u2013ECCV 2016 Workshops: Amsterdam, The Netherlands, October 8-10 and 15-16, 2016, Proceedings, Part II 14, pp. 36\u201342. Springer","DOI":"10.1007\/978-3-319-48881-3_3"},{"issue":"5","key":"2182_CR15","doi-asserted-by":"publisher","first-page":"1183","DOI":"10.1109\/TMM.2018.2875360","volume":"21","author":"Q Zhou","year":"2018","unstructured":"Zhou Q, Zhong B, Zhang Y, Li J, Fu Y (2018) Deep alignment network based multi-person tracking with occlusion and motion reasoning. IEEE Trans Multimedia 21(5):1183\u20131194","journal-title":"IEEE Trans Multimedia"},{"issue":"7","key":"2182_CR16","doi-asserted-by":"publisher","first-page":"1709","DOI":"10.1109\/TMM.2018.2885922","volume":"21","author":"P Dai","year":"2018","unstructured":"Dai P, Wang X, Zhang W, Chen J (2018) Instance segmentation enabled hybrid data association and discriminative hashing for online multi-object tracking. IEEE Trans Multimedia 21(7):1709\u20131723","journal-title":"IEEE Trans Multimedia"},{"issue":"10","key":"2182_CR17","doi-asserted-by":"publisher","first-page":"2825","DOI":"10.1007\/s13042-022-01564-0","volume":"13","author":"K Tan","year":"2022","unstructured":"Tan K, Xu T-B, Wei Z (2022) Online visual tracking via background-aware siamese networks. Int J Mach Learn Cybern 13(10):2825\u20132842","journal-title":"Int J Mach Learn Cybern"},{"key":"2182_CR18","doi-asserted-by":"crossref","unstructured":"Doll\u00e1r P, Wojek C, Schiele B, Perona P (2009) Pedestrian detection: A benchmark. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition, pp. 304\u2013311. IEEE","DOI":"10.1109\/CVPR.2009.5206631"},{"key":"2182_CR19","doi-asserted-by":"crossref","unstructured":"Leibe B, Seemann E, Schiele B (2005) Pedestrian detection in crowded scenes. In: 2005 IEEE Computer Society Conference on Computer Vision and Pattern Recognition (CVPR\u201905), vol. 1, pp. 878\u2013885. IEEE","DOI":"10.1109\/CVPR.2005.272"},{"issue":"8","key":"2182_CR20","doi-asserted-by":"publisher","first-page":"2153","DOI":"10.1007\/s13042-022-01512-y","volume":"13","author":"L Chen","year":"2022","unstructured":"Chen L, Liu H, Mo J, Zhang D, Yang J, Lin F, Zheng Z, Jia R (2022) Cross channel aggregation similarity network for salient object detection. Int J Mach Learn Cybern 13(8):2153\u20132169","journal-title":"Int J Mach Learn Cybern"},{"key":"2182_CR21","doi-asserted-by":"crossref","unstructured":"He S, Luo H, Wang P, Wang F, Li H, Jiang W (2021) Transreid: Transformer-based object re-identification. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 15013\u201315022","DOI":"10.1109\/ICCV48922.2021.01474"},{"key":"2182_CR22","doi-asserted-by":"crossref","unstructured":"Ren M, He L, Liao X, Liu W, Wang Y, Tan T (2021) Learning instance-level spatial-temporal patterns for person re-identification. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 14930\u201314939","DOI":"10.1109\/ICCV48922.2021.01466"},{"issue":"11","key":"2182_CR23","doi-asserted-by":"publisher","first-page":"3523","DOI":"10.1007\/s13042-022-01610-x","volume":"13","author":"X Luo","year":"2022","unstructured":"Luo X, Jiang M, Kong J (2022) Selective relation-aware representations for person re-identification. Int J Mach Learn Cybern 13(11):3523\u20133541","journal-title":"Int J Mach Learn Cybern"},{"issue":"8","key":"2182_CR24","doi-asserted-by":"publisher","first-page":"3703","DOI":"10.1109\/TIP.2018.2818018","volume":"27","author":"X Zhang","year":"2018","unstructured":"Zhang X, Cheng L, Li B, Hu H-M (2018) Too far to see? not really!-pedestrian detection with scale-aware localization policy. IEEE Trans Image Process 27(8):3703\u20133715. https:\/\/doi.org\/10.1109\/TIP.2018.2818018","journal-title":"IEEE Trans Image Process"},{"key":"2182_CR25","unstructured":"Xiaowei Z, Jianwei M, Hong L, Hai-Miao H, Peng Y (2022) Dual attentional siamese network for visual tracking. Displays: Technology and Applications"},{"key":"2182_CR26","doi-asserted-by":"crossref","unstructured":"Zhang X, Li L, Liu H, Yang P, Gao Y(2022) Disentangling classification and regression in siamese-based network for visual tracking. Concurrency and Computation: Practice and Experience 34","DOI":"10.1002\/cpe.7246"},{"key":"2182_CR27","doi-asserted-by":"publisher","first-page":"3069","DOI":"10.1007\/s11263-021-01513-4","volume":"129","author":"Y Zhang","year":"2021","unstructured":"Zhang Y, Wang C, Wang X, Zeng W, Liu W (2021) Fairmot: On the fairness of detection and re-identification in multiple object tracking. Int J Comput Vision 129:3069\u20133087","journal-title":"Int J Comput Vision"},{"key":"2182_CR28","doi-asserted-by":"crossref","unstructured":"Li M, Wu J, Wang X, Chen C, Qin J, Xiao X, Wang R, Zheng M, Pan X (2023) AlignDet: Aligning Pre-training and Fine-tuning in Object Detection","DOI":"10.1109\/ICCV51070.2023.00632"},{"key":"2182_CR29","doi-asserted-by":"crossref","unstructured":"Wang Z, Zheng L, Liu Y, Li Y, Wang S (2020) Towards real-time multi-object tracking. In: European Conference on Computer Vision, pp. 107\u2013122. Springer","DOI":"10.1007\/978-3-030-58621-8_7"},{"key":"2182_CR30","doi-asserted-by":"crossref","unstructured":"Bergmann P, Meinhardt T, Leal-Taixe L (2019) Tracking without bells and whistles. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 941\u2013951","DOI":"10.1109\/ICCV.2019.00103"},{"key":"2182_CR31","doi-asserted-by":"crossref","unstructured":"Lu Z, Rathod V, Votel R, Huang J (2020) Retinatrack: Online single stage joint detection and tracking. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 14668\u201314678","DOI":"10.1109\/CVPR42600.2020.01468"},{"key":"2182_CR32","doi-asserted-by":"publisher","first-page":"3182","DOI":"10.1109\/TIP.2022.3165376","volume":"31","author":"C Liang","year":"2022","unstructured":"Liang C, Zhang Z, Zhou X, Li B, Zhu S, Hu W (2022) Rethinking the competition between detection and reid in multiobject tracking. IEEE Trans Image Process 31:3182\u20133196","journal-title":"IEEE Trans Image Process"},{"key":"2182_CR33","doi-asserted-by":"crossref","unstructured":"Yu E, Li Z, Han S, Wang H (2022) Relationtrack: Relation-aware multiple object tracking with decoupled representation. IEEE Transactions on Multimedia","DOI":"10.1109\/TMM.2022.3150169"},{"key":"2182_CR34","doi-asserted-by":"publisher","unstructured":"Zhou C, Jiang M, Kong J (2023) Bgtracker: Cross-task bidirectional guidance strategy for multiple object tracking. IEEE Transactions on Multimedia 25, 8132\u20138144 https:\/\/doi.org\/10.1109\/TMM.2023.3256761","DOI":"10.1109\/TMM.2023.3256761"},{"issue":"5","key":"2182_CR35","doi-asserted-by":"publisher","first-page":"053007","DOI":"10.1117\/1.JEI.32.5.053007","volume":"32","author":"E Mo","year":"2023","unstructured":"Mo E, Kong J, Jiang M, Liu T (2023) Motion information supplement for joint detection and embedding tracking. J Electron Imaging 32(5):053007\u2013053007","journal-title":"J Electron Imaging"},{"key":"2182_CR36","doi-asserted-by":"publisher","unstructured":"Liu J, Kong J, Jiang M, Liu T (2023) Caltracker: Cross-task association learning for multiple object tracking. IEEE Signal Processing Letters 30, 1622\u20131626 https:\/\/doi.org\/10.1109\/LSP.2023.3329419","DOI":"10.1109\/LSP.2023.3329419"},{"key":"2182_CR37","doi-asserted-by":"crossref","unstructured":"Duan K, Bai S, Xie L, Qi H, Huang Q, Tian Q (2019) Centernet: Keypoint triplets for object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6569\u20136578","DOI":"10.1109\/ICCV.2019.00667"},{"key":"2182_CR38","doi-asserted-by":"crossref","unstructured":"Yang Z, Liu S, Hu H, Wang L, Lin S (2019) Reppoints: Point set representation for object detection. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 9657\u20139666","DOI":"10.1109\/ICCV.2019.00975"},{"key":"2182_CR39","doi-asserted-by":"crossref","unstructured":"Law H, Deng J (2018) Cornernet: Detecting objects as paired keypoints. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 734\u2013750","DOI":"10.1007\/978-3-030-01264-9_45"},{"key":"2182_CR40","doi-asserted-by":"crossref","unstructured":"Dong Z, Li G, Liao Y, Wang F, Ren P, Qian C (2020) Centripetalnet: Pursuing high-quality keypoint pairs for object detection. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10519\u201310528","DOI":"10.1109\/CVPR42600.2020.01053"},{"key":"2182_CR41","doi-asserted-by":"crossref","unstructured":"Duan K, Xie L, Qi H, Bai S, Huang Q, Tian Q (2020) Corner proposal network for anchor-free, two-stage object detection. In: European Conference on Computer Vision, pp. 399\u2013416. Springer","DOI":"10.1007\/978-3-030-58580-8_24"},{"key":"2182_CR42","doi-asserted-by":"crossref","unstructured":"Lan S, Ren Z, Wu Y, Davis LS, Hua G (2020) Saccadenet: A fast and accurate object detector. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10397\u201310406","DOI":"10.1109\/CVPR42600.2020.01041"},{"key":"2182_CR43","doi-asserted-by":"publisher","first-page":"995","DOI":"10.1109\/TMM.2021.3062489","volume":"24","author":"T Gao","year":"2021","unstructured":"Gao T, Pan H, Wang Z, Gao H (2021) A crf-based framework for tracklet inactivation in online multi-object tracking. IEEE Trans Multimedia 24:995\u20131007","journal-title":"IEEE Trans Multimedia"},{"key":"2182_CR44","doi-asserted-by":"crossref","unstructured":"Guo M, Haque A, Huang D-A, Yeung S, Fei-Fei L (2018) Dynamic task prioritization for multitask learning. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 270\u2013287","DOI":"10.1007\/978-3-030-01270-0_17"},{"key":"2182_CR45","unstructured":"Ren S, He K, Girshick R, Sun J (2015) Faster r-cnn: Towards real-time object detection with region proposal networks. Advances in neural information processing systems 28"},{"key":"2182_CR46","doi-asserted-by":"crossref","unstructured":"Yang F, Choi W, Lin Y (2016) Exploit all the layers: Fast and accurate cnn object detector with scale dependent pooling and cascaded rejection classifiers. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2129\u20132137","DOI":"10.1109\/CVPR.2016.234"},{"key":"2182_CR47","unstructured":"Redmon J, Farhadi A (2018) Yolov3: An incremental improvement"},{"key":"2182_CR48","doi-asserted-by":"crossref","unstructured":"Liu W, Anguelov D, Erhan D, Szegedy C, Reed S, Fu C-Y, Berg AC (2016) Ssd: Single shot multibox detector. In: Computer Vision\u2013ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14, pp. 21\u201337. Springer","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"2182_CR49","doi-asserted-by":"crossref","unstructured":"Kalman RE (1960) A new approach to linear filtering and prediction problems","DOI":"10.1115\/1.3662552"},{"key":"2182_CR50","doi-asserted-by":"crossref","unstructured":"Bochinski E, Eiselein V, Sikora T (2017) High-speed tracking-by-detection without using image information. In: 2017 14th IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS), pp. 1\u20136. IEEE","DOI":"10.1109\/AVSS.2017.8078516"},{"key":"2182_CR51","doi-asserted-by":"crossref","unstructured":"Bochinski E, Senst T, Sikora T (2018) Extending iou based multi-object tracking by visual information. In: 2018 15th IEEE International Conference on Advanced Video and Signal Based Surveillance (AVSS), pp. 1\u20136. IEEE","DOI":"10.1109\/AVSS.2018.8639144"},{"key":"2182_CR52","doi-asserted-by":"crossref","unstructured":"Zhu X, Wang Y, Dai J, Yuan L, Wei Y (2017) Flow-guided feature aggregation for video object detection. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 408\u2013417","DOI":"10.1109\/ICCV.2017.52"},{"key":"2182_CR53","doi-asserted-by":"crossref","unstructured":"Guo S, Wang J, Wang X, Tao D (2021) Online multiple object tracking with cross-task synergy. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8136\u20138145","DOI":"10.1109\/CVPR46437.2021.00804"},{"key":"2182_CR54","doi-asserted-by":"crossref","unstructured":"Voigtlaender P, Krause M, Osep A, Luiten J, Sekar BBG, Geiger A, Leibe B (2019) Mots: Multi-object tracking and segmentation. In: Proceedings of the Ieee\/cvf Conference on Computer Vision and Pattern Recognition, pp. 7942\u20137951","DOI":"10.1109\/CVPR.2019.00813"},{"key":"2182_CR55","doi-asserted-by":"crossref","unstructured":"He K, Gkioxari G, Doll\u00e1r P, Girshick R (2017) Mask r-cnn. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2961\u20132969","DOI":"10.1109\/ICCV.2017.322"},{"key":"2182_CR56","doi-asserted-by":"crossref","unstructured":"Zhou X, Koltun V, Kr\u00e4henb\u00fchl P (2020) Tracking objects as points. In: European Conference on Computer Vision, pp. 474\u2013490. Springer","DOI":"10.1007\/978-3-030-58548-8_28"},{"key":"2182_CR57","doi-asserted-by":"crossref","unstructured":"Xia Z, Pan X, Song S, Li LE, Huang G (2022) Vision transformer with deformable attention. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4794\u20134803","DOI":"10.1109\/CVPR52688.2022.00475"},{"key":"2182_CR58","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, Kaiser \u0141, Polosukhin I (2017) Attention is all you need. Advances in neural information processing systems 30"},{"key":"2182_CR59","doi-asserted-by":"crossref","unstructured":"Yu F, Wang D, Shelhamer E, Darrell T (2018) Deep layer aggregation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2403\u20132412","DOI":"10.1109\/CVPR.2018.00255"},{"key":"2182_CR60","doi-asserted-by":"crossref","unstructured":"Dai J, Qi H, Xiong Y, Li Y, Zhang G, Hu H, Wei Y (2017) Deformable convolutional networks. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 764\u2013773","DOI":"10.1109\/ICCV.2017.89"},{"issue":"1\u20132","key":"2182_CR61","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1002\/nav.3800020109","volume":"2","author":"HW Kuhn","year":"1955","unstructured":"Kuhn HW (1955) The hungarian method for the assignment problem. Naval research logistics quarterly 2(1\u20132):83\u201397","journal-title":"Naval research logistics quarterly"},{"issue":"1\u20134","key":"2182_CR62","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1007\/s13042-010-0002-z","volume":"1","author":"LI Kuncheva","year":"2010","unstructured":"Kuncheva LI (2010) Full-class set classification using the hungarian algorithm. Int J Mach Learn Cybern 1(1\u20134):53\u201361","journal-title":"Int J Mach Learn Cybern"},{"key":"2182_CR63","doi-asserted-by":"crossref","unstructured":"Hou Q, Zhou D, Feng J (2021) Coordinate attention for efficient mobile network design. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 13713\u201313722","DOI":"10.1109\/CVPR46437.2021.01350"},{"key":"2182_CR64","first-page":"15475","volume":"34","author":"Q Zhang","year":"2021","unstructured":"Zhang Q, Yang Y-B (2021) Rest: An efficient transformer for visual recognition. Adv Neural Inf Process Syst 34:15475\u201315485","journal-title":"Adv Neural Inf Process Syst"},{"key":"2182_CR65","doi-asserted-by":"crossref","unstructured":"Chollet F (2017) Xception: Deep learning with depthwise separable convolutions. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1251\u20131258","DOI":"10.1109\/CVPR.2017.195"},{"key":"2182_CR66","doi-asserted-by":"crossref","unstructured":"Zhang Q-L, Yang Y-B (2021) Sa-net: Shuffle attention for deep convolutional neural networks. In: ICASSP 2021-2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 2235\u20132239. IEEE","DOI":"10.1109\/ICASSP39728.2021.9414568"},{"key":"2182_CR67","doi-asserted-by":"crossref","unstructured":"Li D, Hu J, Wang C, Li X, She Q, Zhu L, Zhang T, Chen Q (2021) Involution: Inverting the inherence of convolution for visual recognition. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12321\u201312330","DOI":"10.1109\/CVPR46437.2021.01214"},{"key":"2182_CR68","doi-asserted-by":"crossref","unstructured":"Lin T-Y, Goyal P, Girshick R, He K, Doll\u00e1r P (2017) Focal loss for dense object detection. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2980\u20132988","DOI":"10.1109\/ICCV.2017.324"},{"key":"2182_CR69","unstructured":"Shao S, Zhao Z, Li B, Xiao T, Yu G, Zhang X, Sun J (2018) Crowdhuman: A benchmark for detecting human in a crowd"},{"key":"2182_CR70","doi-asserted-by":"crossref","unstructured":"Ess A, Leibe B, Schindler K, Van\u00a0Gool L (2008) A mobile vision system for robust multi-person tracking. In: 2008 IEEE Conference on Computer Vision and Pattern Recognition, pp. 1\u20138. IEEE","DOI":"10.1109\/CVPR.2008.4587730"},{"key":"2182_CR71","doi-asserted-by":"crossref","unstructured":"Zhang S, Benenson R, Schiele B (2017) Citypersons: A diverse dataset for pedestrian detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3213\u20133221","DOI":"10.1109\/CVPR.2017.474"},{"key":"2182_CR72","doi-asserted-by":"crossref","unstructured":"Doll\u00e1r P, Wojek C, Schiele B, Perona P (2009) Pedestrian detection: A benchmark. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition, pp. 304\u2013311. IEEE","DOI":"10.1109\/CVPR.2009.5206631"},{"key":"2182_CR73","doi-asserted-by":"crossref","unstructured":"Xiao T, Li S, Wang B, Lin L, Wang X (2017) Joint detection and identification feature learning for person search. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3415\u20133424","DOI":"10.1109\/CVPR.2017.360"},{"key":"2182_CR74","doi-asserted-by":"crossref","unstructured":"Zheng L, Zhang H, Sun S, Chandraker M, Yang Y, Tian Q (2017) Person re-identification in the wild. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1367\u20131376","DOI":"10.1109\/CVPR.2017.357"},{"key":"2182_CR75","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1155\/2008\/246309","volume":"2008","author":"K Bernardin","year":"2008","unstructured":"Bernardin K, Stiefelhagen R (2008) Evaluating multiple object tracking performance: the clear mot metrics. EURASIP Journal on Image and Video Processing 2008:1\u201310","journal-title":"EURASIP Journal on Image and Video Processing"},{"key":"2182_CR76","doi-asserted-by":"publisher","first-page":"548","DOI":"10.1007\/s11263-020-01375-2","volume":"129","author":"J Luiten","year":"2021","unstructured":"Luiten J, Osep A, Dendorfer P, Torr P, Geiger A, Leal-Taix\u00e9 L, Leibe B (2021) Hota: A higher order metric for evaluating multi-object tracking. Int J Comput Vision 129:548\u2013578","journal-title":"Int J Comput Vision"},{"key":"2182_CR77","doi-asserted-by":"crossref","unstructured":"Lin T-Y, Maire M, Belongie S, Hays J, Perona P, Ramanan D, Doll\u00e1r P, Zitnick CL (2014) Microsoft coco: Common objects in context. In: Computer Vision\u2013ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6-12, 2014, Proceedings, Part V 13, pp. 740\u2013755. Springer","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"2182_CR78","unstructured":"Kingma DP, Ba J (2014) Adam: A method for stochastic optimization"},{"key":"2182_CR79","doi-asserted-by":"crossref","unstructured":"Pang B, Li Y, Zhang Y, Li M, Lu C (2020) Tubetk: Adopting tubes to track multi-object in a one-step training model. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 6308\u20136318","DOI":"10.1109\/CVPR42600.2020.00634"},{"key":"2182_CR80","doi-asserted-by":"crossref","unstructured":"Wang Y, Kitani K, Weng X (2021) Joint object detection and multi-object tracking with graph neural networks. In: 2021 IEEE International Conference on Robotics and Automation (ICRA), pp. 13708\u201313715. IEEE","DOI":"10.1109\/ICRA48506.2021.9561110"},{"key":"2182_CR81","doi-asserted-by":"crossref","unstructured":"Zhou X, Yin T, Koltun V, Kr\u00e4henb\u00fchl P (2022) Global tracking transformers. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8771\u20138780","DOI":"10.1109\/CVPR52688.2022.00857"},{"key":"2182_CR82","doi-asserted-by":"publisher","unstructured":"Lee S-H, Park D-H, Bae S-H (2023) Decode-mot: How can we hurdle frames to go beyond tracking-by-detection? IEEE Transactions on Image Processing 32, 4378\u20134392 https:\/\/doi.org\/10.1109\/TIP.2023.3298538","DOI":"10.1109\/TIP.2023.3298538"},{"key":"2182_CR83","doi-asserted-by":"publisher","unstructured":"Fukui H, Miyagawa T, Morishita Y (2023) Multi-object tracking as attention mechanism. In: 2023 IEEE International Conference on Image Processing (ICIP), pp. 505\u2013509. https:\/\/doi.org\/10.1109\/ICIP49359.2023.10222207","DOI":"10.1109\/ICIP49359.2023.10222207"},{"key":"2182_CR84","doi-asserted-by":"crossref","unstructured":"Stadler D, Beyerer J (2021) Improving multiple pedestrian tracking by track management and occlusion handling. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10958\u201310967","DOI":"10.1109\/CVPR46437.2021.01081"},{"key":"2182_CR85","doi-asserted-by":"publisher","first-page":"333","DOI":"10.1016\/j.neucom.2022.01.008","volume":"483","author":"Q Liu","year":"2022","unstructured":"Liu Q, Chen D, Chu Q, Yuan L, Liu B, Zhang L, Yu N (2022) Online multi-object tracking with unsupervised re-identification learning and occlusion estimation. Neurocomputing 483:333\u2013347","journal-title":"Neurocomputing"}],"container-title":["International Journal of Machine Learning and Cybernetics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13042-024-02182-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s13042-024-02182-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13042-024-02182-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,22]],"date-time":"2025-01-22T07:39:53Z","timestamp":1737531593000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s13042-024-02182-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,2]]},"references-count":85,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2025,1]]}},"alternative-id":["2182"],"URL":"https:\/\/doi.org\/10.1007\/s13042-024-02182-8","relation":{},"ISSN":["1868-8071","1868-808X"],"issn-type":[{"type":"print","value":"1868-8071"},{"type":"electronic","value":"1868-808X"}],"subject":[],"published":{"date-parts":[[2024,5,2]]},"assertion":[{"value":"11 October 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 April 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 May 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}