{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,4]],"date-time":"2026-03-04T08:27:03Z","timestamp":1772612823575,"version":"3.50.1"},"reference-count":50,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2024,1,29]],"date-time":"2024-01-29T00:00:00Z","timestamp":1706486400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,29]],"date-time":"2024-01-29T00:00:00Z","timestamp":1706486400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100009110","name":"Natural Science Foundation of Xinjiang Uygur Autonomous Region","doi-asserted-by":"crossref","id":[{"id":"10.13039\/100009110","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2024,11]]},"DOI":"10.1007\/s00371-023-03226-w","type":"journal-article","created":{"date-parts":[[2024,1,29]],"date-time":"2024-01-29T10:02:34Z","timestamp":1706522554000},"page":"8113-8124","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":22,"title":["Multi-directional guidance network for fine-grained visual classification"],"prefix":"10.1007","volume":"40","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3010-1622","authenticated-orcid":false,"given":"Shengying","family":"Yang","sequence":"first","affiliation":[]},{"given":"Yao","family":"Jin","sequence":"additional","affiliation":[]},{"given":"Jingsheng","family":"Lei","sequence":"additional","affiliation":[]},{"given":"Shuping","family":"Zhang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,1,29]]},"reference":[{"key":"3226_CR1","unstructured":"Wah, C., Branson, S., Welinder, P., Perona, P., Belongie, S.: The caltech-ucsd birds-200-2011 dataset (2011)"},{"key":"3226_CR2","doi-asserted-by":"publisher","DOI":"10.3389\/fpls.2020.600854","volume":"11","author":"G Yang","year":"2020","unstructured":"Yang, G., He, Y., Yang, Y., Xu, B.: Fine-grained image classification for crop disease based on attention mechanism. Front. Plant Sci. 11, 600854 (2020)","journal-title":"Front. Plant Sci."},{"key":"3226_CR3","doi-asserted-by":"crossref","unstructured":"Zhang, N., Donahue, J., Girshick, R., Darrell, T.: Part-based r-cnns for fine-grained category detection. In: Computer Vision-ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6\u201312, 2014, Proceedings, Part I 13, pp. 834\u2013849. Springer (2014)","DOI":"10.1007\/978-3-319-10590-1_54"},{"key":"3226_CR4","doi-asserted-by":"crossref","unstructured":"Huang, S., Xu, Z., Tao, D., Zhang, Y.: Part-stacked cnn for fine-grained visual categorization. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1173\u20131182 (2016)","DOI":"10.1109\/CVPR.2016.132"},{"key":"3226_CR5","doi-asserted-by":"crossref","unstructured":"Lin, D., Shen, X., Lu, C., Jia, J.: Deep lac: Deep localization, alignment and classification for fine-grained recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1666\u20131674 (2015)","DOI":"10.1109\/CVPR.2015.7298775"},{"key":"3226_CR6","doi-asserted-by":"publisher","first-page":"476","DOI":"10.1109\/TIP.2019.2921876","volume":"29","author":"H Zheng","year":"2019","unstructured":"Zheng, H., Fu, J., Zha, Z.-J., Luo, J., Mei, T.: Learning rich part hierarchies with progressive attention networks for fine-grained image recognition. IEEE Trans. Image Process. 29, 476\u2013488 (2019)","journal-title":"IEEE Trans. Image Process."},{"key":"3226_CR7","doi-asserted-by":"crossref","unstructured":"Zhang, T., Chang, D., Ma, Z., Guo, J.: Progressive co-attention network for fine-grained visual classification. In: 2021 International Conference on Visual Communications and Image Processing (VCIP), pp. 1\u20135. IEEE (2021)","DOI":"10.1109\/VCIP53242.2021.9675376"},{"key":"3226_CR8","doi-asserted-by":"crossref","unstructured":"Ding, Y., Zhou, Y., Zhu, Y., Ye, Q., Jiao, J.: Selective sparse sampling for fine-grained image recognition. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 6599\u20136608 (2019)","DOI":"10.1109\/ICCV.2019.00670"},{"key":"3226_CR9","doi-asserted-by":"crossref","unstructured":"Zhang, L., Huang, S., Liu, W., Tao, D.: Learning a mixture of granularity-specific experts for fine-grained categorization. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 8331\u20138340 (2019)","DOI":"10.1109\/ICCV.2019.00842"},{"key":"3226_CR10","doi-asserted-by":"crossref","unstructured":"Xiao, T., Xu, Y., Yang, K., Zhang, J., Peng, Y., Zhang, Z.: The application of two-level attention models in deep convolutional neural network for fine-grained image classification. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 842\u2013850 (2015)","DOI":"10.1109\/CVPR.2015.7298685"},{"key":"3226_CR11","doi-asserted-by":"crossref","unstructured":"Yang, Z., Luo, T., Wang, D., Hu, Z., Gao, J., Wang, L.: Learning to navigate for fine-grained classification. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 420\u2013435 (2018)","DOI":"10.1007\/978-3-030-01264-9_26"},{"key":"3226_CR12","doi-asserted-by":"crossref","unstructured":"Ge, W., Lin, X., Yu, Y.: Weakly supervised complementary parts models for fine-grained image classification from the bottom up. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3034\u20133043 (2019)","DOI":"10.1109\/CVPR.2019.00315"},{"key":"3226_CR13","doi-asserted-by":"crossref","unstructured":"Liu, C., Xie, H., Zha, Z.-J., Ma, L., Yu, L., Zhang, Y.: Filtration and distillation: enhancing region attention for fine-grained visual categorization. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 34, pp. 11555\u201311562 (2020)","DOI":"10.1609\/aaai.v34i07.6822"},{"key":"3226_CR14","doi-asserted-by":"crossref","unstructured":"Sun, M., Yuan, Y., Zhou, F., Ding, E.: Multi-attention multi-class constraint for fine-grained image recognition. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 805\u2013821 (2018)","DOI":"10.1007\/978-3-030-01270-0_49"},{"key":"3226_CR15","doi-asserted-by":"crossref","unstructured":"Zheng, H., Fu, J., Mei, T., Luo, J.: Learning multi-attention convolutional neural network for fine-grained image recognition. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 5209\u20135217 (2017)","DOI":"10.1109\/ICCV.2017.557"},{"key":"3226_CR16","doi-asserted-by":"crossref","unstructured":"Fu, J., Zheng, H., Mei, T.: Look closer to see better: Recurrent attention convolutional neural network for fine-grained image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4438\u20134446 (2017)","DOI":"10.1109\/CVPR.2017.476"},{"key":"3226_CR17","doi-asserted-by":"crossref","unstructured":"He, J., Chen, J.-N., Liu, S., Kortylewski, A., Yang, C., Bai, Y., Wang, C.: Transfg: A transformer architecture for fine-grained recognition. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 36, pp. 852\u2013860 (2022)","DOI":"10.1609\/aaai.v36i1.19967"},{"key":"3226_CR18","unstructured":"Wang, J., Yu, X., Gao, Y.: Feature fusion vision transformer for fine-grained visual categorization. arXiv:2107.02341 (2021)"},{"key":"3226_CR19","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., RoyChowdhury, A., Maji, S.: Bilinear cnn models for fine-grained visual recognition. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1449\u20131457 (2015)","DOI":"10.1109\/ICCV.2015.170"},{"key":"3226_CR20","doi-asserted-by":"crossref","unstructured":"Kong, S., Fowlkes, C.: Low-rank bilinear pooling for fine-grained classification. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 365\u2013374 (2017)","DOI":"10.1109\/CVPR.2017.743"},{"key":"3226_CR21","doi-asserted-by":"crossref","unstructured":"Li, P., Xie, J., Wang, Q., Gao, Z.: Towards faster training of global covariance pooling networks by iterative matrix square root normalization. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 947\u2013955 (2018)","DOI":"10.1109\/CVPR.2018.00105"},{"key":"3226_CR22","doi-asserted-by":"crossref","unstructured":"Liao, Q., Wang, D., Holewa, H., Xu, M.: Squeezed bilinear pooling for fine-grained visual categorization. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision Workshops, pp. 0\u20130 (2019)","DOI":"10.1109\/ICCVW.2019.00093"},{"key":"3226_CR23","doi-asserted-by":"crossref","unstructured":"Shi, X., Xu, L., Wang, P., Gao, Y., Jian, H., Liu, W.: Beyond the attention: Distinguish the discriminative and confusable features for fine-grained image classification. In: Proceedings of the 28th ACM International Conference on Multimedia, pp. 601\u2013609 (2020)","DOI":"10.1145\/3394171.3413883"},{"key":"3226_CR24","doi-asserted-by":"crossref","unstructured":"Gao, Y., Beijbom, O., Zhang, N., Darrell, T.: Compact bilinear pooling. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 317\u2013326 (2016)","DOI":"10.1109\/CVPR.2016.41"},{"key":"3226_CR25","doi-asserted-by":"crossref","unstructured":"Yu, C., Zhao, X., Zheng, Q., Zhang, P., You, X.: Hierarchical bilinear pooling for fine-grained visual recognition. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 574\u2013589 (2018)","DOI":"10.1007\/978-3-030-01270-0_35"},{"key":"3226_CR26","doi-asserted-by":"crossref","unstructured":"Zhuang, P., Wang, Y., Qiao, Y.: Learning attentive pairwise interaction for fine-grained classification. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 34, pp. 13130\u201313137 (2020)","DOI":"10.1609\/aaai.v34i07.7016"},{"key":"3226_CR27","doi-asserted-by":"crossref","unstructured":"Gao, Y., Han, X., Wang, X., Huang, W., Scott, M.: Channel interaction networks for fine-grained image categorization. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 34, pp. 10818\u201310825 (2020)","DOI":"10.1609\/aaai.v34i07.6712"},{"key":"3226_CR28","doi-asserted-by":"crossref","unstructured":"Lin, T.-Y., Doll\u00e1r, P., Girshick, R., He, K., Hariharan, B., Belongie, S.: Feature pyramid networks for object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2117\u20132125 (2017)","DOI":"10.1109\/CVPR.2017.106"},{"key":"3226_CR29","unstructured":"Li, H., Xiong, P., An, J., Wang, L.: Pyramid attention network for semantic segmentation. arXiv:1805.10180 (2018)"},{"key":"3226_CR30","doi-asserted-by":"crossref","unstructured":"Liu, W., Anguelov, D., Erhan, D., Szegedy, C., Reed, S., Fu, C.-Y., Berg, A.C.: Ssd: Single shot multibox detector. In: Computer Vision\u2013ECCV 2016: 14th European Conference, Amsterdam, The Netherlands, October 11\u201314, 2016, Proceedings, Part I 14, pp. 21\u201337. Springer (2016)","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"3226_CR31","doi-asserted-by":"crossref","unstructured":"Chen, X., Fu, C., Zhao, Y., Zheng, F., Song, J., Ji, R., Yang, Y.: Salience-guided cascaded suppression network for person re-identification. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 3300\u20133310 (2020)","DOI":"10.1109\/CVPR42600.2020.00336"},{"key":"3226_CR32","doi-asserted-by":"crossref","unstructured":"Chang, D., Pang, K., Zheng, Y., Ma, Z., Song, Y.-Z., Guo, J.: Your\" flamingo\" is my\" bird\": fine-grained, or not. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11476\u201311485 (2021)","DOI":"10.1109\/CVPR46437.2021.01131"},{"issue":"7","key":"3226_CR33","doi-asserted-by":"publisher","first-page":"2686","DOI":"10.1109\/TCSVT.2020.3027616","volume":"31","author":"J Lei","year":"2020","unstructured":"Lei, J., Li, X., Peng, B., Fang, L., Ling, N., Huang, Q.: Deep spatial-spectral subspace clustering for hyperspectral image. IEEE Trans. Circuits Syst. Video Technol. 31(7), 2686\u20132697 (2020)","journal-title":"IEEE Trans. Circuits Syst. Video Technol."},{"issue":"6","key":"3226_CR34","doi-asserted-by":"publisher","first-page":"2721","DOI":"10.1109\/TIP.2017.2686017","volume":"26","author":"X Song","year":"2017","unstructured":"Song, X., Jiang, S., Herranz, L.: Multi-scale multi-feature context modeling for scene recognition in the semantic manifold. IEEE Trans. Image Process. 26(6), 2721\u20132735 (2017)","journal-title":"IEEE Trans. Image Process."},{"key":"3226_CR35","doi-asserted-by":"publisher","first-page":"265","DOI":"10.1109\/TIP.2019.2929447","volume":"29","author":"S Jiang","year":"2019","unstructured":"Jiang, S., Min, W., Liu, L., Luo, Z.: Multi-scale multi-view deep feature aggregation for food recognition. IEEE Trans. Image Process. 29, 265\u2013276 (2019)","journal-title":"IEEE Trans. Image Process."},{"key":"3226_CR36","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., Darrell, T.: Fully convolutional networks for semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3431\u20133440 (2015)","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"3226_CR37","doi-asserted-by":"crossref","unstructured":"Ronneberger, O., Fischer, P., Brox, T.: U-net: Convolutional networks for biomedical image segmentation. In: Medical Image Computing and Computer-Assisted Intervention\u2013MICCAI 2015: 18th International Conference, Munich, Germany, October 5\u20139, 2015, Proceedings, Part III 18, pp. 234\u2013241. Springer (2015)","DOI":"10.1007\/978-3-319-24574-4_28"},{"key":"3226_CR38","doi-asserted-by":"crossref","unstructured":"Kong, T., Yao, A., Chen, Y., Sun, F.: Hypernet: Towards accurate region proposal generation and joint object detection. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 845\u2013853 (2016)","DOI":"10.1109\/CVPR.2016.98"},{"key":"3226_CR39","doi-asserted-by":"crossref","unstructured":"Yang, Z., Luo, T., Wang, D., Hu, Z., Gao, J., Wang, L.: Learning to navigate for fine-grained classification. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 420\u2013435 (2018)","DOI":"10.1007\/978-3-030-01264-9_26"},{"key":"3226_CR40","doi-asserted-by":"crossref","unstructured":"Zeiler, M.D., Fergus, R.: Visualizing and understanding convolutional networks. In: Computer Vision\u2013ECCV 2014: 13th European Conference, Zurich, Switzerland, September 6-12, 2014, Proceedings, Part I 13, pp. 818\u2013833. Springer (2014)","DOI":"10.1007\/978-3-319-10590-1_53"},{"key":"3226_CR41","doi-asserted-by":"crossref","unstructured":"Krause, J., Stark, M., Deng, J., Fei-Fei, L.: 3d object representations for fine-grained categorization. In: Proceedings of the IEEE International Conference on Computer Vision Workshops, pp. 554\u2013561 (2013)","DOI":"10.1109\/ICCVW.2013.77"},{"key":"3226_CR42","unstructured":"Maji, S., Rahtu, E., Kannala, J., Blaschko, M., Vedaldi, A.: Fine-grained visual classification of aircraft. arXiv:1306.5151 (2013)"},{"key":"3226_CR43","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"3226_CR44","doi-asserted-by":"crossref","unstructured":"Zheng, H., Fu, J., Zha, Z.-J., Luo, J.: Looking for the devil in the details: Learning trilinear attention sampling network for fine-grained image recognition. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5012\u20135021 (2019)","DOI":"10.1109\/CVPR.2019.00515"},{"key":"3226_CR45","doi-asserted-by":"crossref","unstructured":"Zare, M., Ghasemi, M., Zahedi, A., Golalipour, K., Mohammadi, S.K., Mirjalili, S., Abualigah, L.: A global best-guided firefly algorithm for engineering problems. J. Bionic Eng. 1\u201330 (2023)","DOI":"10.1007\/s42235-023-00386-2"},{"issue":"5","key":"3226_CR46","doi-asserted-by":"publisher","first-page":"4099","DOI":"10.1007\/s00521-022-07854-6","volume":"35","author":"JO Agushaka","year":"2023","unstructured":"Agushaka, J.O., Ezugwu, A.E., Abualigah, L.: Gazelle optimization algorithm: a novel nature-inspired metaheuristic optimizer. Neural Comput. Appl. 35(5), 4099\u20134131 (2023)","journal-title":"Neural Comput. Appl."},{"key":"3226_CR47","doi-asserted-by":"publisher","DOI":"10.1016\/j.aei.2023.102004","volume":"57","author":"G Hu","year":"2023","unstructured":"Hu, G., Zheng, Y., Abualigah, L., Hussien, A.G.: Detdo: an adaptive hybrid dandelion optimizer for engineering optimization. Adv. Eng. Inform. 57, 102004 (2023)","journal-title":"Adv. Eng. Inform."},{"key":"3226_CR48","doi-asserted-by":"crossref","unstructured":"Luo, W., Yang, X., Mo, X., Lu, Y., Davis, L.S., Li, J., Yang, J., Lim, S.-N.: Cross-x learning for fine-grained visual categorization. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 8242\u20138251 (2019)","DOI":"10.1109\/ICCV.2019.00833"},{"key":"3226_CR49","doi-asserted-by":"crossref","unstructured":"Chen, Y., Bai, Y., Zhang, W., Mei, T.: Destruction and construction learning for fine-grained image recognition. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5157\u20135166 (2019)","DOI":"10.1109\/CVPR.2019.00530"},{"key":"3226_CR50","doi-asserted-by":"publisher","first-page":"4683","DOI":"10.1109\/TIP.2020.2973812","volume":"29","author":"D Chang","year":"2020","unstructured":"Chang, D., Ding, Y., Xie, J., Bhunia, A.K., Li, X., Ma, Z., Wu, M., Guo, J., Song, Y.-Z.: The devil is in the channels: mutual-channel loss for fine-grained image classification. IEEE Trans. Image Process. 29, 4683\u20134695 (2020)","journal-title":"IEEE Trans. Image Process."}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-023-03226-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-023-03226-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-023-03226-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,6]],"date-time":"2024-11-06T16:15:33Z","timestamp":1730909733000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-023-03226-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,1,29]]},"references-count":50,"journal-issue":{"issue":"11","published-print":{"date-parts":[[2024,11]]}},"alternative-id":["3226"],"URL":"https:\/\/doi.org\/10.1007\/s00371-023-03226-w","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,1,29]]},"assertion":[{"value":"2 December 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 January 2024","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}