{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,6]],"date-time":"2026-06-06T17:08:37Z","timestamp":1780765717669,"version":"3.54.1"},"reference-count":73,"publisher":"Springer Science and Business Media LLC","issue":"9","license":[{"start":{"date-parts":[[2025,5,25]],"date-time":"2025-05-25T00:00:00Z","timestamp":1748131200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,5,25]],"date-time":"2025-05-25T00:00:00Z","timestamp":1748131200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2025,9]]},"DOI":"10.1007\/s11263-025-02486-4","type":"journal-article","created":{"date-parts":[[2025,5,25]],"date-time":"2025-05-25T05:42:07Z","timestamp":1748151727000},"page":"6108-6128","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["PointOBB-v3: Expanding Performance Boundaries of Single Point-Supervised Oriented Object Detection"],"prefix":"10.1007","volume":"133","author":[{"given":"Peiyuan","family":"Zhang","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Junwei","family":"Luo","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xue","family":"Yang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yi","family":"Yu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Qingyun","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yue","family":"Zhou","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xiaosong","family":"Jia","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xudong","family":"Lu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jingdong","family":"Chen","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xiang","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Junchi","family":"Yan","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8203-1246","authenticated-orcid":false,"given":"Yansheng","family":"Li","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2025,5,25]]},"reference":[{"key":"2486_CR1","doi-asserted-by":"crossref","unstructured":"Bearman, A., Russakovsky, O., Ferrari, V., & Fei-Fei, L. What\u2019s the point: Semantic segmentation with point supervision. In: European Conference on Computer Vision, pp. 549\u2013565 (2016). Springer.","DOI":"10.1007\/978-3-319-46478-7_34"},{"key":"2486_CR2","doi-asserted-by":"crossref","unstructured":"Bilen, H., & Vedaldi, A. Weakly supervised deep detection networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2846\u20132854 (2016).","DOI":"10.1109\/CVPR.2016.311"},{"key":"2486_CR3","doi-asserted-by":"crossref","unstructured":"Bilen, H., & Vedaldi, A. Weakly supervised deep detection networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2846\u20132854 (2016).","DOI":"10.1109\/CVPR.2016.311"},{"key":"2486_CR4","doi-asserted-by":"crossref","unstructured":"Chen, Z., Fu, Z., Jiang, R., Chen, Y., & Hua, X.-S. Slv: Spatial likelihood voting for weakly supervised object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 12995\u201313004 (2020).","DOI":"10.1109\/CVPR42600.2020.01301"},{"key":"2486_CR5","doi-asserted-by":"crossref","unstructured":"Chen, Z., Fu, Z., Jiang, R., Chen, Y., & Hua, X.-S. Slv: Spatial likelihood voting for weakly supervised object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 12995\u201313004 (2020).","DOI":"10.1109\/CVPR42600.2020.01301"},{"key":"2486_CR6","unstructured":"Chen, K., Wang, J., Pang, J., Cao, Y., Xiong, Y., Li, X., Sun, S., Feng, W., Liu, Z., Xu, J., et al.: Mmdetection: Open mmlab detection toolbox and benchmark. arXiv preprint arXiv:1906.07155 (2019)."},{"key":"2486_CR7","doi-asserted-by":"crossref","unstructured":"Chen, L., Yang, T., Zhang, X., Zhang, W., & Sun, J. Points as queries: Weakly semi-supervised object detection by points. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 8823\u20138832 (2021).","DOI":"10.1109\/CVPR46437.2021.00871"},{"key":"2486_CR8","doi-asserted-by":"crossref","unstructured":"Chen, P., Yu, X., Han, X., Hassan, N., Wang, K., Li, J., Zhao, J., Shi, H., Han, Z., & Ye, Q. Point-to-box network for accurate object detection via single point supervision. In: European Conference on Computer Vision, pp. 51\u201367 (2022). Springer.","DOI":"10.1007\/978-3-031-20077-9_4"},{"key":"2486_CR9","doi-asserted-by":"crossref","unstructured":"Cheng, B., Parkhi, O., & Kirillov, A. Pointly-supervised instance segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2617\u20132626 (2022).","DOI":"10.1109\/CVPR52688.2022.00264"},{"key":"2486_CR10","first-page":"1","volume":"60","author":"G Cheng","year":"2022","unstructured":"Cheng, G., Wang, J., Li, K., Xie, X., Lang, C., Yao, Y., & Han, J. (2022). Anchor-free oriented proposal generator for object detection. IEEE Transactions on Geoscience and Remote Sensing, 60, 1\u201311.","journal-title":"IEEE Transactions on Geoscience and Remote Sensing"},{"key":"2486_CR11","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.-J., Li, K., & Fei-Fei, L. Imagenet: A large-scale hierarchical image database. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition, pp. 248\u2013255 (2009). Ieee.","DOI":"10.1109\/CVPR.2009.5206848"},{"issue":"1\u20132","key":"2486_CR12","doi-asserted-by":"publisher","first-page":"31","DOI":"10.1016\/S0004-3702(96)00034-3","volume":"89","author":"TG Dietterich","year":"1997","unstructured":"Dietterich, T. G., Lathrop, R. H., & Lozano-P\u00e9rez, T. (1997). Solving the multiple instance problem with axis-parallel rectangles. Artificial intelligence, 89(1\u20132), 31\u201371.","journal-title":"Artificial intelligence"},{"key":"2486_CR13","doi-asserted-by":"crossref","unstructured":"Ding, J., Xue, N., Long, Y., Xia, G.-S., & Lu, Q. Learning roi transformer for oriented object detection in aerial images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2849\u20132858 (2019).","DOI":"10.1109\/CVPR.2019.00296"},{"key":"2486_CR14","doi-asserted-by":"crossref","unstructured":"Fan, J., Zhang, Z., & Tan, T. Pointly-supervised panoptic segmentation. In: European Conference on Computer Vision, pp. 319\u2013336 (2022). Springer.","DOI":"10.1007\/978-3-031-20056-4_19"},{"key":"2486_CR15","doi-asserted-by":"crossref","unstructured":"Feng, X., Yao, X., Cheng, G., & Han, J. Weakly supervised rotation-invariant aerial object detection network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 14146\u201314155 (2022).","DOI":"10.1109\/CVPR52688.2022.01375"},{"key":"2486_CR16","doi-asserted-by":"crossref","unstructured":"Feng, X., Yao, X., Cheng, G., & Han, J. Weakly supervised rotation-invariant aerial object detection network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 14146\u201314155 (2022).","DOI":"10.1109\/CVPR52688.2022.01375"},{"issue":"10","key":"2486_CR17","doi-asserted-by":"publisher","first-page":"11977","DOI":"10.1109\/TPAMI.2023.3275142","volume":"45","author":"X Feng","year":"2023","unstructured":"Feng, X., Yao, X., Shen, H., Cheng, G., Xiao, B., & Han, J. (2023). Learning an invariant and equivariant network for weakly supervised object detection. IEEE Transactions on Pattern Analysis and Machine Intelligence, 45(10), 11977\u201311992.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"issue":"10","key":"2486_CR18","doi-asserted-by":"publisher","first-page":"11977","DOI":"10.1109\/TPAMI.2023.3275142","volume":"45","author":"X Feng","year":"2023","unstructured":"Feng, X., Yao, X., Shen, H., Cheng, G., Xiao, B., & Han, J. (2023). Learning an invariant and equivariant network for weakly supervised object detection. IEEE Transactions on Pattern Analysis and Machine Intelligence, 45(10), 11977\u201311992.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2486_CR19","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., & Malik, J. Rich feature hierarchies for accurate object detection and semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 580\u2013587 (2014).","DOI":"10.1109\/CVPR.2014.81"},{"key":"2486_CR20","doi-asserted-by":"crossref","unstructured":"Han, J., Ding, J., Xue, N., & Xia, G.-S. Redet: A rotation-equivariant detector for aerial object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2786\u20132795 (2021).","DOI":"10.1109\/CVPR46437.2021.00281"},{"key":"2486_CR21","first-page":"1","volume":"60","author":"J Han","year":"2021","unstructured":"Han, J., Ding, J., Li, J., & Xia, G.-S. (2021). Align deep features for oriented object detection. IEEE transactions on geoscience and remote sensing, 60, 1\u201311.","journal-title":"IEEE transactions on geoscience and remote sensing"},{"key":"2486_CR22","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016).","DOI":"10.1109\/CVPR.2016.90"},{"key":"2486_CR23","first-page":"1","volume":"62","author":"S He","year":"2023","unstructured":"He, S., Zou, H., Wang, Y., Li, B., Cao, X., & Jing, N. (2023). Learning remote sensing object detection with single point supervision. IEEE Transactions on Geoscience and Remote Sensing, 62, 1\u20136.","journal-title":"IEEE Transactions on Geoscience and Remote Sensing"},{"key":"2486_CR24","doi-asserted-by":"publisher","first-page":"310","DOI":"10.1016\/j.neucom.2021.01.075","volume":"440","author":"J Iqbal","year":"2021","unstructured":"Iqbal, J., Munir, M. A., Mahmood, A., Ali, A. R., & Ali, M. (2021). Leveraging orientation for weakly supervised object detection with application to firearm localization. Neurocomputing, 440, 310\u2013320.","journal-title":"Neurocomputing"},{"key":"2486_CR25","doi-asserted-by":"crossref","unstructured":"Li, W., Chen, Y., Hu, K., & Zhu, J. Oriented reppoints for aerial object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1829\u20131838 (2022).","DOI":"10.1109\/CVPR52688.2022.00187"},{"key":"2486_CR26","unstructured":"Li, Q., Chen, Y., Shu, X., Chen, D., He, X., Yu, Y., & Yang, X. A simple aerial detection baseline of multimodal language models. arXiv preprint arXiv:2501.09720 (2025)."},{"key":"2486_CR27","doi-asserted-by":"crossref","unstructured":"Li, Y., Hou, Q., Zheng, Z., Cheng, M.-M., Yang, J., & Li, X. Large selective kernel network for remote sensing object detection. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 16794\u201316805 (2023).","DOI":"10.1109\/ICCV51070.2023.01540"},{"key":"2486_CR28","doi-asserted-by":"crossref","unstructured":"Li, W., Liu, W., Zhu, J., Cui, M., Hua, X.-S., & Zhang, L. Box-supervised instance segmentation with level set evolution. In: European Conference on Computer Vision, pp. 1\u201318 (2022). Springer.","DOI":"10.1007\/978-3-031-19818-2_1"},{"key":"2486_CR29","doi-asserted-by":"crossref","unstructured":"Li, Y., Luo, J., Zhang, Y., Tan, Y., Yu, J.-G., & Bai, S. Learning to holistically detect bridges from large-size vhr remote sensing imagery. IEEE Transactions on Pattern Analysis and Machine Intelligence (2024).","DOI":"10.1109\/TPAMI.2024.3393024"},{"key":"2486_CR30","doi-asserted-by":"crossref","unstructured":"Li, W., Yuan, Y., Wang, S., Zhu, J., Li, J., Liu, J., & Zhang, L. Point2mask: Point-supervised panoptic segmentation via optimal transport. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 572\u2013581 (2023).","DOI":"10.1109\/ICCV51070.2023.00059"},{"key":"2486_CR31","doi-asserted-by":"crossref","unstructured":"Liao, M., Zhu, Z., Shi, B., Xia, G.-s., & Bai, X. Rotation-sensitive regression for oriented scene text detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5909\u20135918 (2018).","DOI":"10.1109\/CVPR.2018.00619"},{"key":"2486_CR32","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., & Belongie, S. Feature pyramid networks for object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2117\u20132125 (2017).","DOI":"10.1109\/CVPR.2017.106"},{"key":"2486_CR33","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Goyal, P., Girshick, R., He, K., & Doll\u00e1r, P. Focal loss for dense object detection. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2980\u20132988 (2017).","DOI":"10.1109\/ICCV.2017.324"},{"key":"2486_CR34","doi-asserted-by":"crossref","unstructured":"Liu, X., Liang, D., Yan, S., Chen, D., Qiao, Y., & Yan, J. Fots: Fast oriented text spotting with a unified network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5676\u20135685 (2018).","DOI":"10.1109\/CVPR.2018.00595"},{"key":"2486_CR35","doi-asserted-by":"publisher","first-page":"296","DOI":"10.1016\/j.isprsjprs.2019.11.023","volume":"159","author":"K Li","year":"2020","unstructured":"Li, K., Wan, G., Cheng, G., Meng, L., & Han, J. (2020). Object detection in optical remote sensing images: A survey and a new benchmark. ISPRS journal of photogrammetry and remote sensing, 159, 296\u2013307.","journal-title":"ISPRS journal of photogrammetry and remote sensing"},{"issue":"3","key":"2486_CR36","doi-asserted-by":"publisher","first-page":"1832","DOI":"10.1109\/TPAMI.2024.3508072","volume":"47","author":"Y Li","year":"2024","unstructured":"Li, Y., Wang, L., Wang, T., Yang, X., Luo, J., Wang, Q., Deng, Y., Wang, W., Sun, X., Li, H., et al. (2024). Star: A first-ever dataset and a large-scale benchmark for scene graph generation in large-size satellite imagery. IEEE Transactions on Pattern Analysis and Machine Intelligence, 47(3), 1832\u20131849.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2486_CR37","doi-asserted-by":"crossref","unstructured":"Luo, J., Yang, X., Yu, Y., Li, Q., Yan, J., & Li, Y. Pointobb: Learning oriented object detection via single point supervision. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 16730\u201316740 (2024).","DOI":"10.1109\/CVPR52733.2024.01583"},{"key":"2486_CR38","doi-asserted-by":"crossref","unstructured":"Papadopoulos, D.P., Uijlings, J.R., Keller, F., & Ferrari, V. Training object class detectors with click supervision. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 6374\u20136383 (2017).","DOI":"10.1109\/CVPR.2017.27"},{"key":"2486_CR39","doi-asserted-by":"crossref","unstructured":"Papadopoulos, D.P., Uijlings, J.R., Keller, F., & Ferrari, V. Training object class detectors with click supervision. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 6374\u20136383 (2017).","DOI":"10.1109\/CVPR.2017.27"},{"key":"2486_CR40","unstructured":"Ren, B., Yang, X., Yu, Y., Luo, J., & Deng, Z. Pointobb-v2: Towards simpler, faster, and stronger single point supervised oriented object detection. arXiv preprint arXiv:2410.08210 (2024)."},{"key":"2486_CR41","doi-asserted-by":"crossref","unstructured":"Ren, Z., Yu, Z., Yang, X., Liu, M.-Y., Schwing, A.G., & Kautz, J. Ufo 2: A unified framework towards omni-supervised object detection. In: European Conference on Computer Vision, pp. 288\u2013313 (2020). Springer.","DOI":"10.1007\/978-3-030-58529-7_18"},{"key":"2486_CR42","doi-asserted-by":"crossref","unstructured":"Ren, Z., Yu, Z., Yang, X., Liu, M.-Y., Schwing, A.G., & Kautz, J. Ufo 2: A unified framework towards omni-supervised object detection. In: European Conference on Computer Vision, pp. 288\u2013313 (2020). Springer.","DOI":"10.1007\/978-3-030-58529-7_18"},{"key":"2486_CR43","first-page":"7005","volume":"33","author":"Y Shen","year":"2020","unstructured":"Shen, Y., Ji, R., Chen, Z., Wu, Y., & Huang, F. (2020). Uwsod: Toward fully-supervised-level capacity weakly supervised object detection. Advances in Neural Information Processing Systems, 33, 7005\u20137019.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2486_CR44","doi-asserted-by":"crossref","unstructured":"Sun, Y., Ran, J., Yang, F., Gao, C., Kurozumi, T., Kimata, H., & Ye, Z. Oriented object detection for remote sensing images based on weakly supervised learning. In: 2021 IEEE International Conference on Multimedia & Expo Workshops (ICMEW), pp. 1\u20136 (2021). IEEE","DOI":"10.1109\/ICMEW53276.2021.9455957"},{"key":"2486_CR45","doi-asserted-by":"publisher","first-page":"116","DOI":"10.1016\/j.isprsjprs.2021.12.004","volume":"184","author":"X Sun","year":"2022","unstructured":"Sun, X., Wang, P., Yan, Z., Xu, F., Wang, R., Diao, W., Chen, J., Li, J., Feng, Y., Xu, T., et al. (2022). Fair1m: A benchmark dataset for fine-grained object recognition in high-resolution remote sensing imagery. ISPRS Journal of Photogrammetry and Remote Sensing, 184, 116\u2013130.","journal-title":"ISPRS Journal of Photogrammetry and Remote Sensing"},{"key":"2486_CR46","doi-asserted-by":"crossref","unstructured":"Tang, P., Wang, X., Bai, X., & Liu, W. Multiple instance detection network with online instance classifier refinement. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2843\u20132851 (2017).","DOI":"10.1109\/CVPR.2017.326"},{"key":"2486_CR47","doi-asserted-by":"crossref","unstructured":"Tang, P., Wang, X., Bai, X., & Liu, W. Multiple instance detection network with online instance classifier refinement. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2843\u20132851 (2017).","DOI":"10.1109\/CVPR.2017.326"},{"issue":"1","key":"2486_CR48","doi-asserted-by":"publisher","first-page":"176","DOI":"10.1109\/TPAMI.2018.2876304","volume":"42","author":"P Tang","year":"2018","unstructured":"Tang, P., Wang, X., Bai, S., Shen, W., Bai, X., Liu, W., & Yuille, A. (2018). Pcl: Proposal cluster learning for weakly supervised object detection. IEEE transactions on pattern analysis and machine intelligence, 42(1), 176\u2013191.","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"issue":"1","key":"2486_CR49","doi-asserted-by":"publisher","first-page":"176","DOI":"10.1109\/TPAMI.2018.2876304","volume":"42","author":"P Tang","year":"2018","unstructured":"Tang, P., Wang, X., Bai, S., Shen, W., Bai, X., Liu, W., & Yuille, A. (2018). Pcl: Proposal cluster learning for weakly supervised object detection. IEEE transactions on pattern analysis and machine intelligence, 42(1), 176\u2013191.","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"key":"2486_CR50","first-page":"1","volume":"61","author":"Z Tan","year":"2023","unstructured":"Tan, Z., Jiang, Z., Guo, C., & Zhang, H. (2023). Wsodet: A weakly supervised oriented detector for aerial object detection. IEEE Transactions on Geoscience and Remote Sensing, 61, 1\u201312.","journal-title":"IEEE Transactions on Geoscience and Remote Sensing"},{"key":"2486_CR51","doi-asserted-by":"crossref","unstructured":"Tian, Z., Shen, C., Wang, X., & Chen, H. Boxinst: High-performance instance segmentation with box annotations. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5443\u20135452 (2021).","DOI":"10.1109\/CVPR46437.2021.00540"},{"issue":"4","key":"2486_CR52","first-page":"1922","volume":"44","author":"Z Tian","year":"2020","unstructured":"Tian, Z., Shen, C., Chen, H., & He, T. (2020). Fcos: A simple and strong anchor-free object detector. IEEE transactions on pattern analysis and machine intelligence, 44(4), 1922\u20131933.","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"key":"2486_CR53","doi-asserted-by":"crossref","unstructured":"Wan, F., Wei, P., Jiao, J., Han, Z., & Ye, Q. Min-entropy latent model for weakly supervised object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1297\u20131306 (2018).","DOI":"10.1109\/CVPR.2018.00141"},{"key":"2486_CR54","doi-asserted-by":"crossref","unstructured":"Xia, G.-S., Bai, X., Ding, J., Zhu, Z., Belongie, S., Luo, J., Datcu, M., Pelillo, M., & Zhang, L. Dota: A large-scale dataset for object detection in aerial images. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3974\u20133983 (2018).","DOI":"10.1109\/CVPR.2018.00418"},{"key":"2486_CR55","doi-asserted-by":"crossref","unstructured":"Xie, X., Cheng, G., Wang, J., Yao, X., & Han, J. Oriented r-cnn for object detection. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 3520\u20133529 (2021).","DOI":"10.1109\/ICCV48922.2021.00350"},{"issue":"4","key":"2486_CR56","doi-asserted-by":"publisher","first-page":"1452","DOI":"10.1109\/TPAMI.2020.2974745","volume":"43","author":"Y Xu","year":"2020","unstructured":"Xu, Y., Fu, M., Wang, Q., Wang, Y., Chen, K., Xia, G.-S., & Bai, X. (2020). Gliding vertex on the horizontal bounding box for multi-oriented object detection. IEEE transactions on pattern analysis and machine intelligence, 43(4), 1452\u20131459.","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"key":"2486_CR57","doi-asserted-by":"crossref","unstructured":"Yang, X., & Yan, J. Arbitrary-oriented object detection with circular smooth label. In: Computer Vision\u2013ECCV 2020: 16th European Conference, Glasgow, UK, August 23\u201328, 2020, Proceedings, Part VIII 16, pp. 677\u2013694 (2020). Springer.","DOI":"10.1007\/978-3-030-58598-3_40"},{"key":"2486_CR58","doi-asserted-by":"crossref","unstructured":"Yang, X., Hou, L., Zhou, Y., Wang, W., & Yan, J. Dense label encoding for boundary discontinuity free rotation detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 15819\u201315829 (2021).","DOI":"10.1109\/CVPR46437.2021.01556"},{"key":"2486_CR59","unstructured":"Yang, X., Yan, J., Ming, Q., Wang, W., Zhang, X., & Tian, Q. Rethinking rotated object detection with gaussian wasserstein distance loss. In: International Conference on Machine Learning, pp. 11830\u201311841 (2021). PMLR."},{"key":"2486_CR60","unstructured":"Yang, X., Zhang, G., Li, W., Wang, X., Zhou, Y., & Yan, J. H2rbox: Horizontal box annotation is all you need for oriented object detection. In: The Eleventh International Conference on Learning Representations (2023)."},{"key":"2486_CR61","doi-asserted-by":"publisher","first-page":"3163","DOI":"10.1609\/aaai.v35i4.16426","volume":"35","author":"X Yang","year":"2021","unstructured":"Yang, X., Yan, J., Feng, Z., & He, T. (2021). R3det: Refined single-stage detector with feature refinement for rotating object. Proceedings of the AAAI Conference on Artificial Intelligence, 35, 3163\u20133171.","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"key":"2486_CR62","first-page":"18381","volume":"34","author":"X Yang","year":"2021","unstructured":"Yang, X., Yang, X., Yang, J., Ming, Q., Wang, W., Tian, Q., & Yan, J. (2021). Learning high-precision bounding box for rotated object detection via kullback-leibler divergence. Advances in Neural Information Processing Systems, 34, 18381\u201318394.","journal-title":"Advances in Neural Information Processing Systems"},{"issue":"4","key":"2486_CR63","first-page":"4335","volume":"45","author":"X Yang","year":"2022","unstructured":"Yang, X., Zhang, G., Yang, X., Zhou, Y., Wang, W., Tang, J., He, T., & Yan, J. (2022). Detecting rotated objects as gaussian distributions and its 3-d generalization. IEEE Transactions on Pattern Analysis and Machine Intelligence, 45(4), 4335\u20134354.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2486_CR64","doi-asserted-by":"crossref","unstructured":"Ying, X., Liu, L., Wang, Y., Li, R., Chen, N., Lin, Z., Sheng, W., & Zhou, S. Mapping degeneration meets label evolution: Learning infrared small target detection with single point supervision. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 15528\u201315538 (2023).","DOI":"10.1109\/CVPR52729.2023.01490"},{"key":"2486_CR65","doi-asserted-by":"crossref","unstructured":"Yu, Y., & Da, F. Phase-shifting coder: Predicting accurate orientation in oriented object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 13354\u201313363 (2023).","DOI":"10.1109\/CVPR52729.2023.01283"},{"key":"2486_CR66","doi-asserted-by":"crossref","unstructured":"Yu, X., Chen, P., Wu, D., Hassan, N., Li, G., Yan, J., Shi, H., Ye, Q., & Han, Z. Object localization under single coarse point supervision. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4868\u20134877 (2022).","DOI":"10.1109\/CVPR52688.2022.00482"},{"key":"2486_CR67","doi-asserted-by":"crossref","unstructured":"Yu, Y., Yang, X., Li, Q., Da, F., Dai, J., Qiao, Y., & Yan, J. Point2rbox: Combine knowledge from synthetic visual patterns for end-to-end oriented object detection with single point supervision. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 16783\u201316793 (2024).","DOI":"10.1109\/CVPR52733.2024.01588"},{"key":"2486_CR68","first-page":"59137","volume":"36","author":"Y Yu","year":"2024","unstructured":"Yu, Y., Yang, X., Li, Q., Zhou, Y., Da, F., & Yan, J. (2024). H2rbox-v2: Incorporating symmetry for boosting horizontal box supervised oriented object detection. Advances in Neural Information Processing Systems, 36, 59137\u201359150.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"2486_CR69","doi-asserted-by":"crossref","unstructured":"Zhang, X., Yang, X., Li, Y., Yang, J., Cheng, M.-M., & Li, X. Rsar: Restricted state angle resolver and rotated sar benchmark. arXiv preprint arXiv:2501.04440 (2025).","DOI":"10.1109\/CVPR52734.2025.00695"},{"issue":"9","key":"2486_CR70","first-page":"5866","volume":"44","author":"D Zhang","year":"2021","unstructured":"Zhang, D., Han, J., Cheng, G., & Yang, M.-H. (2021). Weakly supervised object localization and detection: A survey. IEEE transactions on pattern analysis and machine intelligence, 44(9), 5866\u20135885.","journal-title":"IEEE transactions on pattern analysis and machine intelligence"},{"key":"2486_CR71","doi-asserted-by":"crossref","unstructured":"Zhou, Y., Yang, X., Zhang, G., Wang, J., Liu, Y., Hou, L., Jiang, X., Liu, X., Yan, J., Lyu, C., et al.: Mmrotate: A rotated object detection benchmark using pytorch. In: Proceedings of the 30th ACM International Conference on Multimedia. MM \u201922, pp. 7331\u20137334 (2022).","DOI":"10.1145\/3503161.3548541"},{"key":"2486_CR72","first-page":"4","volume":"1","author":"Z-H Zhou","year":"2004","unstructured":"Zhou, Z.-H. (2004). Multi-instance learning: A survey. Department of Computer Science & Technology, Nanjing University. Tech. Rep, 1, 4.","journal-title":"Tech. Rep"},{"key":"2486_CR73","doi-asserted-by":"crossref","unstructured":"Zhu, T., Ferenczi, B., Purkait, P., Drummond, T., Rezatofighi, H., & Van Den\u00a0Hengel, A. Knowledge combination to learn rotated detection without rotated annotation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 15518\u201315527 (2023).","DOI":"10.1109\/CVPR52729.2023.01489"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02486-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-025-02486-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-025-02486-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T07:58:38Z","timestamp":1757404718000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-025-02486-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,25]]},"references-count":73,"journal-issue":{"issue":"9","published-print":{"date-parts":[[2025,9]]}},"alternative-id":["2486"],"URL":"https:\/\/doi.org\/10.1007\/s11263-025-02486-4","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,5,25]]},"assertion":[{"value":"23 January 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 May 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 May 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}