{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,12]],"date-time":"2026-02-12T10:51:10Z","timestamp":1770893470922,"version":"3.50.1"},"reference-count":84,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2023,12,2]],"date-time":"2023-12-02T00:00:00Z","timestamp":1701475200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,12,2]],"date-time":"2023-12-02T00:00:00Z","timestamp":1701475200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100004739","name":"Youth Innovation Promotion Association of the Chinese Academy of Sciences","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100004739","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2024,5]]},"DOI":"10.1007\/s11263-023-01937-0","type":"journal-article","created":{"date-parts":[[2023,12,2]],"date-time":"2023-12-02T08:02:05Z","timestamp":1701504125000},"page":"1659-1684","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":14,"title":["BioDrone: A Bionic Drone-Based Single Object Tracking Benchmark for Robust Vision"],"prefix":"10.1007","volume":"132","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7660-9897","authenticated-orcid":false,"given":"Xin","family":"Zhao","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5872-7566","authenticated-orcid":false,"given":"Shiyu","family":"Hu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0005-0125-9553","authenticated-orcid":false,"given":"Yipei","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Jing","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Yimin","family":"Hu","sequence":"additional","affiliation":[]},{"given":"Rongshuai","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Haibin","family":"Ling","sequence":"additional","affiliation":[]},{"given":"Yin","family":"Li","sequence":"additional","affiliation":[]},{"given":"Renshu","family":"Li","sequence":"additional","affiliation":[]},{"given":"Kun","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Jiadong","family":"Li","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,12,2]]},"reference":[{"issue":"9","key":"1937_CR1","doi-asserted-by":"publisher","first-page":"961","DOI":"10.1007\/s11263-018-1070-x","volume":"126","author":"H Abu Alhaija","year":"2018","unstructured":"Abu Alhaija, H., Mustikovela, S. K., Mescheder, L., Geiger, A., & Rother, C. (2018). Augmented reality meets computer vision: Efficient data generation for urban driving scenes. International Journal of Computer Vision, 126(9), 961\u2013972.","journal-title":"International Journal of Computer Vision"},{"key":"1937_CR2","doi-asserted-by":"crossref","unstructured":"Barrientos, A., Colorado, J., Martinez, A., & Valente, J. (2010). Rotary-wing mav modeling and control for indoor scenarios. In 2010 IEEE international conference on industrial technology (pp. 1475\u20131480). IEEE.","DOI":"10.1109\/ICIT.2010.5472486"},{"key":"1937_CR3","doi-asserted-by":"crossref","unstructured":"Bertinetto, L., Valmadre, J., Henriques, J. F., Vedaldi, A., & Torr, P. H. (2016). Fully-convolutional siamese networks for object tracking. In European conference on computer vision (pp. 850\u2013865). Springer.","DOI":"10.1007\/978-3-319-48881-3_56"},{"key":"1937_CR4","doi-asserted-by":"crossref","unstructured":"Bhat, G., Danelljan, M., Gool, L. V., & Timofte, R. (2019). Learning discriminative model prediction for tracking. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 6182\u20136191).","DOI":"10.1109\/ICCV.2019.00628"},{"key":"1937_CR5","doi-asserted-by":"crossref","unstructured":"Bhat, G., Danelljan, M., Gool, L. V., & Timofte, R. (2020). Know your surroundings: Exploiting scene information for object tracking. In European conference on computer vision (pp. 205\u2013221). Springer.","DOI":"10.1007\/978-3-030-58592-1_13"},{"key":"1937_CR6","doi-asserted-by":"crossref","unstructured":"Bondi, E., Dey, D., Kapoor, A., Piavis, J., Shah, S., Fang, F., Dilkina, B., Hannaford, R., Iyer, A., Joppa, L., et\u00a0al. (2018). Airsim-w: A simulation environment for wildlife conservation with uavs. In Proceedings of the 1st ACM SIGCAS conference on computing and sustainable societies (pp. 1\u201312).","DOI":"10.1145\/3209811.3209880"},{"key":"1937_CR7","doi-asserted-by":"crossref","unstructured":"Bondi, E., Jain, R., Aggrawal, P., Anand, S., Hannaford, R., Kapoor, A., Piavis, J., Shah, S., Joppa, L., & Dilkina, B., et\u00a0al. (2020). Birdsai: A dataset for detection and tracking in aerial thermal infrared videos. In Proceedings of the IEEE\/CVF Winter conference on applications of computer vision (pp. 1747\u20131756).","DOI":"10.1109\/WACV45572.2020.9093284"},{"key":"1937_CR8","doi-asserted-by":"crossref","unstructured":"Cao, Z., Huang, Z., Pan, L., Zhang, S., Liu, Z., & Fu, C. (2022). Tctrack: Temporal contexts for aerial tracking. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 14798\u201314808).","DOI":"10.1109\/CVPR52688.2022.01438"},{"key":"1937_CR9","doi-asserted-by":"crossref","unstructured":"Chatfield, K., Simonyan, K., Vedaldi, A., & Zisserman, A. (2014). Return of the devil in the details: Delving deep into convolutional nets. arXiv preprint arXiv:1405.3531.","DOI":"10.5244\/C.28.6"},{"key":"1937_CR10","doi-asserted-by":"crossref","unstructured":"Cui, Y., Jiang, C., Wang, L., & Wu, G. (2022). Mixformer: End-to-end tracking with iterative mixed attention. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 13608\u201313618).","DOI":"10.1109\/CVPR52688.2022.01324"},{"key":"1937_CR11","doi-asserted-by":"crossref","unstructured":"Dalal, N., & Triggs, B. (2005). Histograms of oriented gradients for human detection. In 2005 IEEE Computer Society Conference on Computer Vision and Pattern Recognition (CVPR\u201905) (Vol. 1, pp. 886\u2013893). IEEE.","DOI":"10.1109\/CVPR.2005.177"},{"key":"1937_CR12","doi-asserted-by":"crossref","unstructured":"Danelljan, M., Bhat, G., Khan, F. S., & Felsberg, M. (2019). Atom: Accurate tracking by overlap maximization. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 4660\u20134669).","DOI":"10.1109\/CVPR.2019.00479"},{"key":"1937_CR13","doi-asserted-by":"crossref","unstructured":"Danelljan, M., Bhat, G., Shahbaz\u00a0Khan, F., & Felsberg, M. (2017). Eco: Efficient convolution operators for tracking. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 6638\u20136646).","DOI":"10.1109\/CVPR.2017.733"},{"key":"1937_CR14","doi-asserted-by":"crossref","unstructured":"Danelljan, M., Gool, L. V., & Timofte, R. (2020). Probabilistic regression for visual tracking. In 2020 IEEE conference on computer vision and pattern recognition (CVPR).","DOI":"10.1109\/CVPR42600.2020.00721"},{"key":"1937_CR15","doi-asserted-by":"publisher","first-page":"978","DOI":"10.1007\/978-94-017-9208-0","volume-title":"The delfly","author":"G De Croon","year":"2016","unstructured":"De Croon, G., Per\u00e7in, M., Remes, B., Ruijsink, R., & De Wagter, C. (2016). The delfly (pp. 978\u201394). Dordrecht: Springer."},{"issue":"4","key":"1937_CR16","doi-asserted-by":"publisher","first-page":"845","DOI":"10.1007\/s11263-020-01393-0","volume":"129","author":"P Dendorfer","year":"2021","unstructured":"Dendorfer, P., Osep, A., Milan, A., Schindler, K., Cremers, D., Reid, I., Roth, S., & Leal-Taix\u00e9, L. (2021). Motchallenge: A benchmark for single-camera multiple target tracking. International Journal of Computer Vision, 129(4), 845\u2013881.","journal-title":"International Journal of Computer Vision"},{"key":"1937_CR17","doi-asserted-by":"crossref","unstructured":"DeTone, D., Malisiewicz, T., & Rabinovich, A. (2018). Superpoint: Self-supervised interest point detection and description. In Proceedings of the IEEE conference on computer vision and pattern recognition workshops (pp. 224\u2013236).","DOI":"10.1109\/CVPRW.2018.00060"},{"issue":"27","key":"1937_CR18","doi-asserted-by":"publisher","first-page":"eaau0307","DOI":"10.1126\/scirobotics.aau0307","volume":"4","author":"J Dupeyroux","year":"2019","unstructured":"Dupeyroux, J., Serres, J. R., & Viollet, S. (2019). Antbot: A six-legged walking robot able to home like desert ants in outdoor environments. Science Robotics, 4(27), eaau0307.","journal-title":"Science Robotics"},{"issue":"2","key":"1937_CR19","doi-asserted-by":"publisher","first-page":"439","DOI":"10.1007\/s11263-020-01387-y","volume":"129","author":"H Fan","year":"2021","unstructured":"Fan, H., Bai, H., Lin, L., Yang, F., Chu, P., Deng, G., Yu, S., Huang, M., Liu, J., Xu, Y., et al. (2021). Lasot: A high-quality large-scale single object tracking benchmark. International Journal of Computer Vision, 129(2), 439\u2013461.","journal-title":"International Journal of Computer Vision"},{"key":"1937_CR20","doi-asserted-by":"crossref","unstructured":"Finlayson, G. D., & Trezzi, E. (2004). Shades of gray and colour constancy. In The twelfth color imaging conference 2004 (pp. 37\u201341).","DOI":"10.2352\/CIC.2004.12.1.art00008"},{"key":"1937_CR21","doi-asserted-by":"crossref","unstructured":"Fraire, A. E., Morado, R. P., L\u00f3pez, A. D., & Leal, R. L. (2015). Design and implementation of fixed-wing mav controllers. In 2015 Workshop on research, education and development of unmanned aerial systems (RED-UAS) (pp. 172\u2013179). IEEE.","DOI":"10.1109\/RED-UAS.2015.7441004"},{"issue":"3","key":"1937_CR22","doi-asserted-by":"publisher","first-page":"335","DOI":"10.1007\/s11263-011-0431-5","volume":"94","author":"S Gauglitz","year":"2011","unstructured":"Gauglitz, S., H\u00f6llerer, T., & Turk, M. (2011). Evaluation of interest point detectors and feature descriptors for visual tracking. International Journal of Computer Vision, 94(3), 335\u2013360.","journal-title":"International Journal of Computer Vision"},{"key":"1937_CR23","doi-asserted-by":"crossref","unstructured":"Girshick, R. (2015). Fast r-cnn. In Proceedings of the IEEE international conference on computer vision (pp. 1440\u20131448).","DOI":"10.1109\/ICCV.2015.169"},{"key":"1937_CR24","doi-asserted-by":"crossref","unstructured":"Guo, D., Wang, J., Cui, Y., Wang, Z., & Chen, S. (2020). Siamcar: Siamese fully convolutional classification and regression for visual tracking. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 6269\u20136277).","DOI":"10.1109\/CVPR42600.2020.00630"},{"issue":"10","key":"1937_CR25","doi-asserted-by":"publisher","first-page":"2927","DOI":"10.1007\/s11263-021-01507-2","volume":"129","author":"L Han","year":"2021","unstructured":"Han, L., Wang, P., Yin, Z., Wang, F., & Li, H. (2021). Context and structure mining network for video object detection. International Journal of Computer Vision, 129(10), 2927\u20132946.","journal-title":"International Journal of Computer Vision"},{"key":"1937_CR26","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2016). Deep residual learning for image recognition. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 770\u2013778).","DOI":"10.1109\/CVPR.2016.90"},{"issue":"3","key":"1937_CR27","doi-asserted-by":"publisher","first-page":"583","DOI":"10.1109\/TPAMI.2014.2345390","volume":"37","author":"JF Henriques","year":"2014","unstructured":"Henriques, J. F., Caseiro, R., Martins, P., & Batista, J. (2014). High-speed tracking with kernelized correlation filters. IEEE Transactions on Pattern Analysis and Machine Intelligence, 37(3), 583\u2013596.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1937_CR28","doi-asserted-by":"crossref","unstructured":"Hsieh, M.-R., Lin, Y.-L., & Hsu, W. H. (2017). Drone-based object counting by spatially regularized regional proposal network. In Proceedings of the IEEE international conference on computer vision (pp. 4145\u20134153).","DOI":"10.1109\/ICCV.2017.446"},{"issue":"2","key":"1937_CR29","doi-asserted-by":"publisher","first-page":"316","DOI":"10.1007\/s11263-021-01554-9","volume":"130","author":"Q Hu","year":"2022","unstructured":"Hu, Q., Yang, B., Khalid, S., Xiao, W., Trigoni, N., & Markham, A. (2022). Sensaturban: Learning semantics from urban-scale photogrammetric point clouds. International Journal of Computer Vision, 130(2), 316\u2013343.","journal-title":"International Journal of Computer Vision"},{"key":"1937_CR30","doi-asserted-by":"publisher","unstructured":"Hu, S., Zhao, X. & Huang, K. (2023). SOTVerse: A user-defined task space of single object tracking. International Journal of Computer Vision.https:\/\/doi.org\/10.1007\/s11263-023-01908-5.","DOI":"10.1007\/s11263-023-01908-5"},{"issue":"1","key":"1937_CR31","doi-asserted-by":"publisher","first-page":"576","DOI":"10.1109\/TPAMI.2022.3153312","volume":"45","author":"S Hu","year":"2023","unstructured":"Hu, S., Zhao, X., Huang, L., & Huang, K. (2023). Global instance tracking: Locating target more like humans. IEEE Transactions on Pattern Analysis and Machine Intelligence, 45(1), 576\u2013592.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1937_CR32","doi-asserted-by":"crossref","unstructured":"Huang, L., Zhao, X., & Huang, K. (2020). Globaltrack: A simple and strong baseline for long-term tracking. In Proceedings of the AAAI conference on artificial intelligence (Vol. 34, pp. 11037\u201311044).","DOI":"10.1609\/aaai.v34i07.6758"},{"issue":"5","key":"1937_CR33","doi-asserted-by":"publisher","first-page":"1562","DOI":"10.1109\/TPAMI.2019.2957464","volume":"43","author":"L Huang","year":"2021","unstructured":"Huang, L., Zhao, X., & Huang, K. (2021). Got-10k: A large high-diversity benchmark for generic object tracking in the wild. IEEE Transactions on Pattern Analysis and Machine Intelligence, 43(5), 1562\u20131577.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1937_CR34","doi-asserted-by":"crossref","unstructured":"Jiang, B., Luo, R., Mao, J., Xiao, T., & Jiang, Y. (2018). Acquisition of localization confidence for accurate object detection. In Proceedings of the European conference on computer vision (ECCV) (pp. 784\u2013799).","DOI":"10.1007\/978-3-030-01264-9_48"},{"issue":"5","key":"1937_CR35","doi-asserted-by":"publisher","first-page":"1366","DOI":"10.1007\/s11263-022-01594-9","volume":"130","author":"Y Kong","year":"2022","unstructured":"Kong, Y., & Fu, Y. (2022). Human action recognition and prediction: A survey. International Journal of Computer Vision, 130(5), 1366\u20131401.","journal-title":"International Journal of Computer Vision"},{"key":"1937_CR36","doi-asserted-by":"crossref","unstructured":"Kristan, M., Leonardis, A., Matas, J., Felsberg, M., Pflugfelder, R., \u010cehovin, L., Voj\u00edr, T., H\u00e4ger, G., Luke\u017ei\u010d, A., Fern\u00e1ndez, G., Gupta, A., Petrosino, A., Memarmoghadam, A., Garcia-Martin, A., Sol\u00eds\u00a0Montero, A., et al. (2016). The visual object tracking VOT2016 challenge results. In Computer vision\u2014ECCV 2016 workshops (pp. 777\u2013823). Springer.","DOI":"10.1007\/978-3-319-48881-3_54"},{"key":"1937_CR37","doi-asserted-by":"crossref","unstructured":"Kristan, M., Leonardis, A., Matas, J., Felsberg, M., Pflugfelder, R., K\u00e4m\u00e4r\u00e4inen, J.-K., Danelljan, M., Zajc, L.\u010c., Luke\u017ei\u010d, A., Drbohlav, O., He, L., et al. (2020). The eighth visual object tracking VOT2020 challenge results. In Computer vision\u2014ECCV 2020 workshops (pp. 547\u2013601). Springer.","DOI":"10.1007\/978-3-030-68238-5_39"},{"key":"1937_CR38","unstructured":"Kristan, M., Leonardis, A., Matas, J., Felsberg, M., Pflugfelder, R., Zajc, L. \u010c., Voj\u00edr, T., Bhat, G., Luke\u017ei\u010d, A., Eldesokey, A., Fern\u00e1ndez, G., et al. (2019a). The sixth visual object tracking VOT2018 challenge results. In Computer vision\u2014ECCV 2018 workshops (pp. 3\u201353). Springer."},{"key":"1937_CR39","doi-asserted-by":"crossref","unstructured":"Kristan, M., Leonardis, A., Matas, J., Felsberg, M., Pflugfelder, R., Zajc, L. C., Voj\u00edr, T., H\u00e4ger, G., Luke\u017eic, A., Eldesokey, A., Fern\u00e1ndez, G., Garc\u00eda-Mart\u00edn, \u00c1., Muhic, A., Petrosino, A., Memarmoghadam, A., et al. (2017). The visual object tracking VOT2017 challenge results. In Proceedings of 2017 IEEE international conference on computer vision workshops (ICCVW) (pp. 1949\u20131972). IEEE, Venice, Italy.","DOI":"10.1109\/ICCVW.2017.230"},{"key":"1937_CR40","unstructured":"Kristan, M., Matas, J., Leonardis, A., Felsberg, M., Cehovin, L., Fernandez, G., Vojir, T., Hager, G., Nebehay, G., Pflugfelder, R., Gupta, A., Bibi, A., Lukezic, A., Garcia-Martin, A., Saffari, A., Petrosino, A., & Solis\u00a0Montero, A. (2015). The visual object tracking VOT2015 challenge results. In Proceedings of 2015 IEEE international conference on computer vision workshop (ICCVW) (pp. 564\u2013586). IEEE."},{"key":"1937_CR41","unstructured":"Kristan, M., Matas, J., Leonardis, A., Felsberg, M., Pflugfelder, R., K\u00e4m\u00e4r\u00e4inen, J.-K., Cehovin\u00a0Zajc, L., Drbohlav, O., Lukezic, A., Berg, A., Eldesokey, A., K\u00e4pyl\u00e4, J., Fern\u00e1ndez, G., Gonzalez-Garcia, A., Memarmoghadam, A., et al. (2019b). The seventh visual object tracking VOT2019 challenge results. In Proceedings of 2019 IEEE\/CVF international conference on computer vision workshop (ICCVW) (pp. 2206\u20132241). IEEE, Seoul, Korea (South)."},{"key":"1937_CR42","doi-asserted-by":"crossref","unstructured":"Kristan, M., Matas, J., Leonardis, A., Felsberg, M., Pflugfelder, R., K\u00e4m\u00e4r\u00e4inen, J.-K., Chang, H. J., Danelljan, M., Zajc, L. \u010c., Luke\u017ei\u010d, A., Drbohlav, O., et al. (2021). The ninth visual object tracking VOT2021 challenge results. In Proceedings of 2021 IEEE\/CVF international conference on computer vision workshops (ICCVW) (pp. 2711\u20132738). IEEE, Montreal, BC, Canada.","DOI":"10.1109\/ICCVW54120.2021.00305"},{"key":"1937_CR43","doi-asserted-by":"crossref","unstructured":"Kristan, M., Pflugfelder, R., Leonardis, A., Matas, J., Porikli, F., Cehovin, L., Nebehay, G., Fernandez, G., Vojir, T., Gatt, A., Khajenezhad, A., Salahledin, A., Soltani-Farani, A., et al. (2013). The visual object tracking VOT2013 challenge results. In Proceedings of 2013 IEEE international conference on computer vision workshops (ICCVW) (pp. 98\u2013111). IEEE.","DOI":"10.1109\/ICCVW.2013.20"},{"key":"1937_CR44","doi-asserted-by":"publisher","first-page":"191","DOI":"10.1007\/978-3-319-16181-5_14","volume-title":"Computer vision: ECCV 2014 workshops","author":"M Kristan","year":"2014","unstructured":"Kristan, M., Pflugfelder, R. P., Leonardis, A., Matas, J., Cehovin, L., Nebehay, G., Voj\u00edr, T., Fern\u00e1ndez, G., Lukezic, A., Dimitriev, A., Petrosino, A., Saffari, A. A., et al. (2014). The visual object tracking VOT2014 challenge results. In L. Agapito, M. M. Bronstein, & C. Rother (Eds.), Computer vision: ECCV 2014 workshops (Vol. 8926, pp. 191\u2013217). Springer."},{"key":"1937_CR45","unstructured":"Krizhevsky, A., Sutskever, I., & Hinton, G. E. (2012). Imagenet classification with deep convolutional neural networks. In Advances in neural information processing systems 25."},{"key":"1937_CR46","doi-asserted-by":"publisher","first-page":"111","DOI":"10.1016\/j.compfluid.2018.03.017","volume":"173","author":"N Lee","year":"2018","unstructured":"Lee, N., Lee, S., Cho, H., & Shin, S. (2018). Effect of flexibility on flapping wing characteristics in hover and forward flight. Computers & Fluids, 173, 111\u2013117.","journal-title":"Computers & Fluids"},{"key":"1937_CR47","doi-asserted-by":"crossref","unstructured":"Li, B., Wu, W., Wang, Q., Zhang, F., Xing, J., & Yan, J. (2019). Siamrpn++: Evolution of siamese visual tracking with very deep networks. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 4282\u20134291).","DOI":"10.1109\/CVPR.2019.00441"},{"key":"1937_CR48","doi-asserted-by":"crossref","unstructured":"Li, B., Yan, J., Wu, W., Zhu, Z., & Hu, X. (2018). High performance visual tracking with siamese region proposal network. In The IEEE conference on computer vision and pattern recognition (CVPR).","DOI":"10.1109\/CVPR.2018.00935"},{"key":"1937_CR49","doi-asserted-by":"crossref","unstructured":"Li, S., & Yeung, D.-Y. (2017). Visual object tracking for unmanned aerial vehicles: A benchmark and new motion models. In Thirty-first AAAI conference on artificial intelligence.","DOI":"10.1609\/aaai.v31i1.11205"},{"issue":"2","key":"1937_CR50","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1007\/s11263-019-01247-4","volume":"128","author":"L Liu","year":"2020","unstructured":"Liu, L., Ouyang, W., Wang, X., Fieguth, P., Chen, J., Liu, X., & Pietik\u00e4inen, M. (2020). Deep learning for generic object detection: A survey. International Journal of Computer Vision, 128(2), 261\u2013318.","journal-title":"International Journal of Computer Vision"},{"issue":"2","key":"1937_CR51","doi-asserted-by":"publisher","first-page":"548","DOI":"10.1007\/s11263-020-01375-2","volume":"129","author":"J Luiten","year":"2021","unstructured":"Luiten, J., Osep, A., Dendorfer, P., Torr, P., Geiger, A., Leal-Taix\u00e9, L., & Leibe, B. (2021). Hota: A higher order metric for evaluating multi-object tracking. International Journal of Computer Vision, 129(2), 548\u2013578.","journal-title":"International Journal of Computer Vision"},{"key":"1937_CR52","doi-asserted-by":"crossref","unstructured":"Mayer, C., Danelljan, M., Paudel, D.P., & Van\u00a0Gool, L. (2021). Learning target candidate association to keep track of what not to track. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 13444\u201313454).","DOI":"10.1109\/ICCV48922.2021.01319"},{"key":"1937_CR53","doi-asserted-by":"crossref","unstructured":"McMasters, J., & Cummings, R. (2004). Rethinking the airplane design process: An early 21st century perspective. In 42nd AIAA aerospace sciences meeting and exhibit (p. 693).","DOI":"10.2514\/6.2004-693"},{"issue":"1","key":"1937_CR54","doi-asserted-by":"publisher","first-page":"10","DOI":"10.2514\/2.2919","volume":"39","author":"JH McMasters","year":"2002","unstructured":"McMasters, J. H., & Cummings, R. M. (2002). Airplane design: Past, present, and future. Journal of Aircraft, 39(1), 10\u201317.","journal-title":"Journal of Aircraft"},{"key":"1937_CR55","doi-asserted-by":"crossref","unstructured":"Muller, M., Bibi, A., Giancola, S., Alsubaihi, S., & Ghanem, B. (2018). Trackingnet: A large-scale dataset and benchmark for object tracking in the wild. In Proceedings of the European conference on computer vision (ECCV) (pp. 300\u2013317).","DOI":"10.1007\/978-3-030-01246-5_19"},{"issue":"9","key":"1937_CR56","doi-asserted-by":"publisher","first-page":"902","DOI":"10.1007\/s11263-018-1073-7","volume":"126","author":"M M\u00fcller","year":"2018","unstructured":"M\u00fcller, M., Casser, V., Lahoud, J., Smith, N., & Ghanem, B. (2018). Sim4cv: A photo-realistic simulator for computer vision applications. International Journal of Computer Vision, 126(9), 902\u2013919.","journal-title":"International Journal of Computer Vision"},{"key":"1937_CR57","doi-asserted-by":"crossref","unstructured":"Mueller, M., Smith, N., & Ghanem, B. (2016). A benchmark and simulator for uav tracking. In European conference on computer vision (pp. 445\u2013461). Springer.","DOI":"10.1007\/978-3-319-46448-0_27"},{"key":"1937_CR58","doi-asserted-by":"crossref","unstructured":"Pech-Pacheco, J. L., Cristobal, G., Chamorro-Martinez, J., & Fernandez-Valdivia, J. (2000). Diatom autofocusing in brightfield microscopy: A comparative study. In Proceedings 15th international conference on pattern recognition. ICPR-2000 (Vol. 3, pp. 314\u2013317).","DOI":"10.1109\/ICPR.2000.903548"},{"key":"1937_CR59","unstructured":"Pornsin-Sirirak, T. N., Tai, Y.-C., Ho, C.-M., & Keennon, M. (2001). Microbat: A palm-sized electrically powered ornithopter. In Proceedings of NASA\/JPL workshop on biomorphic robotics (Vol. 14, p. 17). Citeseer."},{"issue":"5","key":"1937_CR60","doi-asserted-by":"publisher","first-page":"1616","DOI":"10.1007\/s11263-021-01437-z","volume":"129","author":"SK Ramakrishnan","year":"2021","unstructured":"Ramakrishnan, S. K., Jayaraman, D., & Grauman, K. (2021). An exploration of embodied visual exploration. International Journal of Computer Vision, 129(5), 1616\u20131649.","journal-title":"International Journal of Computer Vision"},{"key":"1937_CR61","unstructured":"Ren, S., He, K., Girshick, R., & Sun, J. (2015). Faster r-cnn: Towards real-time object detection with region proposal networks. In Advances in neural information processing systems, 28."},{"key":"1937_CR62","doi-asserted-by":"crossref","unstructured":"Rezatofighi, H., Tsoi, N., Gwak, J., Sadeghian, A., Reid, I., & Savarese, S. (2019). Generalized intersection over union: A metric and a loss for bounding box regression. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 658\u2013666).","DOI":"10.1109\/CVPR.2019.00075"},{"issue":"6","key":"1937_CR63","doi-asserted-by":"publisher","first-page":"534","DOI":"10.1108\/ir.2004.31.6.534.2","volume":"31","author":"J Rigelsford","year":"2004","unstructured":"Rigelsford, J. (2004). Neurotechnology for biomimetic robots. Industrial Robot: An International Journal, 31(6), 534.","journal-title":"Industrial Robot: An International Journal"},{"issue":"3","key":"1937_CR64","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky, O., Deng, J., Su, H., Krause, J., Satheesh, S., Ma, S., Huang, Z., Karpathy, A., Khosla, A., Bernstein, M., et al. (2015). Imagenet large scale visual recognition challenge. International Journal of Computer Vision, 115(3), 211\u2013252.","journal-title":"International Journal of Computer Vision"},{"key":"1937_CR65","doi-asserted-by":"crossref","unstructured":"Ryu, S., Kwon, U., & Kim, H. J. (2016). Autonomous flight and vision-based target tracking for a flapping-wing mav. In 2016 IEEE\/RSJ international conference on intelligent robots and systems (IROS) (pp. 5645\u20135650). IEEE.","DOI":"10.1109\/IROS.2016.7759830"},{"key":"1937_CR66","doi-asserted-by":"crossref","unstructured":"Sarlin, P.-E., DeTone, D., Malisiewicz, T., & Rabinovich, A. (2020). Superglue: Learning feature matching with graph neural networks. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 4938\u20134947).","DOI":"10.1109\/CVPR42600.2020.00499"},{"key":"1937_CR67","doi-asserted-by":"publisher","first-page":"1591","DOI":"10.2307\/2938280","volume":"59","author":"CA Sims","year":"1991","unstructured":"Sims, C. A., & Uhlig, H. (1991). Understanding unit rooters: A helicopter tour. Econometrica: Journal of the Econometric Society, 59, 1591\u20131599.","journal-title":"Econometrica: Journal of the Econometric Society"},{"key":"1937_CR68","doi-asserted-by":"crossref","unstructured":"Tan, M., Pang, R., & Le, Q. V. (2020). Efficientdet: Scalable and efficient object detection. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 10781\u201310790).","DOI":"10.1109\/CVPR42600.2020.01079"},{"key":"1937_CR69","doi-asserted-by":"crossref","unstructured":"Tian, Z., Shen, C., Chen, H., & He, T. (2019). Fcos: Fully convolutional one-stage object detection. In Proceedings of the IEEE\/CVF international conference on computer vision (pp. 9627\u20139636).","DOI":"10.1109\/ICCV.2019.00972"},{"issue":"7","key":"1937_CR70","doi-asserted-by":"publisher","first-page":"1512","DOI":"10.1109\/TIP.2009.2019809","volume":"18","author":"J Van De Weijer","year":"2009","unstructured":"Van De Weijer, J., Schmid, C., Verbeek, J., & Larlus, D. (2009). Learning color names for real-world applications. IEEE Transactions on Image Processing, 18(7), 1512\u20131523.","journal-title":"IEEE Transactions on Image Processing"},{"key":"1937_CR71","doi-asserted-by":"crossref","unstructured":"Voigtlaender, P., Luiten, J., Torr, P. H., & Leibe, B. (2020). Siam r-cnn: Visual tracking by re-detection. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 6578\u20136588).","DOI":"10.1109\/CVPR42600.2020.00661"},{"issue":"1","key":"1937_CR72","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1109\/MGRS.2021.3115137","volume":"10","author":"X Wu","year":"2021","unstructured":"Wu, X., Li, W., Hong, D., Tao, R., & Du, Q. (2021). Deep learning for unmanned aerial vehicle-based object detection and tracking: A survey. IEEE Geoscience and Remote Sensing Magazine, 10(1), 91\u2013124.","journal-title":"IEEE Geoscience and Remote Sensing Magazine"},{"key":"1937_CR73","doi-asserted-by":"crossref","unstructured":"Wu, Y., Lim, J., & Yang, M.-H. (2013). Online object tracking: A benchmark. In 2013 IEEE conference on computer vision and pattern recognition (pp. 2411\u20132418).","DOI":"10.1109\/CVPR.2013.312"},{"issue":"9","key":"1937_CR74","doi-asserted-by":"publisher","first-page":"1834","DOI":"10.1109\/TPAMI.2014.2388226","volume":"37","author":"Y Wu","year":"2015","unstructured":"Wu, Y., Lim, J., & Yang, M.-H. (2015). Object tracking benchmark. IEEE Transactions on Pattern Analysis and Machine Intelligence, 37(9), 1834\u20131848.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1937_CR75","doi-asserted-by":"crossref","unstructured":"Xia, G.-S., Bai, X., Ding, J., Zhu, Z., Belongie, S., Luo, J., Datcu, M., Pelillo, M., & Zhang, L. (2018). Dota: A large-scale dataset for object detection in aerial images. In Proceedings of the IEEE conference on computer vision and pattern recognition (pp. 3974\u20133983).","DOI":"10.1109\/CVPR.2018.00418"},{"key":"1937_CR76","doi-asserted-by":"crossref","unstructured":"Xu, Y., Wang, Z., Li, Z., Yuan, Y., & Yu, G. (2020). Siamfc++: Towards robust and accurate visual tracking with target estimation guidelines. In Proceedings of the AAAI conference on artificial intelligence (Vol. 34, pp. 12549\u201312556).","DOI":"10.1609\/aaai.v34i07.6944"},{"issue":"1","key":"1937_CR77","doi-asserted-by":"publisher","first-page":"70","DOI":"10.1177\/1756829317734837","volume":"10","author":"W Yang","year":"2018","unstructured":"Yang, W., Wang, L., & Song, B. (2018). Dove: A biomimetic flapping-wing micro air vehicle. International Journal of Micro Air Vehicles, 10(1), 70\u201384.","journal-title":"International Journal of Micro Air Vehicles"},{"issue":"5","key":"1937_CR78","doi-asserted-by":"publisher","first-page":"1141","DOI":"10.1007\/s11263-019-01266-1","volume":"128","author":"H Yu","year":"2020","unstructured":"Yu, H., Li, G., Zhang, W., Huang, Q., Du, D., Tian, Q., & Sebe, N. (2020). The unmanned aerial vehicle benchmark: Object detection, tracking and baseline. International Journal of Computer Vision, 128(5), 1141\u20131159.","journal-title":"International Journal of Computer Vision"},{"issue":"2","key":"1937_CR79","doi-asserted-by":"publisher","DOI":"10.1088\/1748-3190\/aa58d3","volume":"12","author":"C Zhang","year":"2017","unstructured":"Zhang, C., & Rossi, C. (2017). A review of compliant transmission mechanisms for bio-inspired flapping-wing micro air vehicles. Bioinspiration & Biomimetics, 12(2), 025005.","journal-title":"Bioinspiration & Biomimetics"},{"key":"1937_CR80","doi-asserted-by":"crossref","unstructured":"Zhang, Z., & Peng, H. (2019). Deeper and wider siamese networks for real-time visual tracking. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition (pp. 4591\u20134600).","DOI":"10.1109\/CVPR.2019.00472"},{"key":"1937_CR81","doi-asserted-by":"crossref","unstructured":"Zhang, Z., Peng, H., Fu, J., Li, B., & Hu, W. (2020). Ocean: Object-aware anchor-free tracking. In European conference on computer vision (pp. 771\u2013787). Springer.","DOI":"10.1007\/978-3-030-58589-1_46"},{"key":"1937_CR82","doi-asserted-by":"crossref","unstructured":"Zheng, Z., Wang, P., Liu, W., Li, J., Ye, R., & Ren, D. (2020). Distance-iou loss: Faster and better learning for bounding box regression. In Proceedings of the AAAI conference on artificial intelligence (Vol. 34, pp. 12993\u201313000).","DOI":"10.1609\/aaai.v34i07.6999"},{"issue":"11","key":"1937_CR83","doi-asserted-by":"publisher","first-page":"7380","DOI":"10.1109\/TPAMI.2021.3119563","volume":"44","author":"P Zhu","year":"2021","unstructured":"Zhu, P., Wen, L., Du, D., Bian, X., Fan, H., Hu, Q., & Ling, H. (2021). Detection and tracking meet drones challenge. IEEE Transactions on Pattern Analysis and Machine Intelligence, 44(11), 7380\u20137399.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1937_CR84","doi-asserted-by":"crossref","unstructured":"Zhu, Z., Wang, Q., Li, B., Wu, W., Yan, J., & Hu, W. (2018). Distractor-aware siamese networks for visual object tracking. In Proceedings of the European conference on computer vision (ECCV) (pp. 101\u2013117).","DOI":"10.1007\/978-3-030-01240-3_7"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-023-01937-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-023-01937-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-023-01937-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,5,7]],"date-time":"2024-05-07T08:14:57Z","timestamp":1715069697000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-023-01937-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,12,2]]},"references-count":84,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2024,5]]}},"alternative-id":["1937"],"URL":"https:\/\/doi.org\/10.1007\/s11263-023-01937-0","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,12,2]]},"assertion":[{"value":"16 December 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 October 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 December 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"All authors declare no conflicts of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}},{"value":"The toolkit and experimental results will be made publicly available.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Code availability"}}]}}