{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,26]],"date-time":"2026-02-26T15:20:57Z","timestamp":1772119257629,"version":"3.50.1"},"reference-count":51,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2024,9,26]],"date-time":"2024-09-26T00:00:00Z","timestamp":1727308800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,9,26]],"date-time":"2024-09-26T00:00:00Z","timestamp":1727308800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2025,4]]},"DOI":"10.1007\/s00371-024-03650-6","type":"journal-article","created":{"date-parts":[[2024,9,26]],"date-time":"2024-09-26T09:02:29Z","timestamp":1727341349000},"page":"4129-4141","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Improved fine-grained image classification in few-shot learning based on channel-spatial attention and grouped bilinear convolution"],"prefix":"10.1007","volume":"41","author":[{"given":"Ziwei","family":"Zeng","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lihong","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zoufei","family":"Zhao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Qingqing","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,9,26]]},"reference":[{"key":"3650_CR1","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2024.110485","volume":"153","author":"XX Li","year":"2024","unstructured":"Li, X.X., Zhen, L., Xie, J.Y., Yang, X.C., Xue, J.H., Ma, Z.Y.: Self-reconstruction network for fine-grained few-shot classification. Pattern Recogn. 153, 110485 (2024)","journal-title":"Pattern Recogn."},{"key":"3650_CR2","doi-asserted-by":"crossref","unstructured":"Yang, L.F., Li, X., Song, R.J., Zhao, B.R., Tao, J.T., Zhou, S.H., Liang, J.J., Yang, J.: Dynamic mlp for fine-grained image classification by leveraging geographical and temporal information. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 10945\u201310954 (2022)","DOI":"10.1109\/CVPR52688.2022.01067"},{"key":"3650_CR3","doi-asserted-by":"crossref","unstructured":"Jiang, J.J., Chen, Z.W., Lei, F.Y., Xu, L., Huang, J.H., Yuan, X.C.: Multi-granularity hypergraph enhanced hierarchical neural network framework for visual classification. Vis. Comput. (2024)","DOI":"10.21203\/rs.3.rs-3985239\/v1"},{"key":"3650_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/TGRS.2024.3505979","volume":"62","author":"J Zheng","year":"2024","unstructured":"Zheng, J., Li, M., Li, X., Zhang, P., Wu, Y.: Revisiting local and global descriptor-based metric network for few-shot SAR target classification. IEEE Trans. Geosci. Remote Sens. 62, 1\u201314 (2024)","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"issue":"8","key":"3650_CR5","doi-asserted-by":"publisher","first-page":"10422","DOI":"10.1109\/TNNLS.2023.3241919","volume":"35","author":"H Cheng","year":"2023","unstructured":"Cheng, H., Wang, Y.F., Li, H.L., Kot, A.C., Wen, B.H.: Disentangled feature representation for few-shot image classification. IEEE Trans. Neural Netw. Learn. Syst. 35(8), 10422\u201310435 (2023)","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"3650_CR6","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2023.110477","volume":"268","author":"TY Xia","year":"2023","unstructured":"Xia, T.Y., Liao, B.W., Tian, Y.: Few-shot relation classification using clustering-based prototype modification. Knowl.-Based Syst. 268, 110477 (2023)","journal-title":"Knowl.-Based Syst."},{"key":"3650_CR7","doi-asserted-by":"crossref","unstructured":"Sung, F., Yang, Y.X., Zhang,L., Xiang, T., Torr, P.H.S., Hospedales, T.M.: Learning to compare: relation network for few-shot learning. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1199\u20131208 (2018)","DOI":"10.1109\/CVPR.2018.00131"},{"issue":"12","key":"3650_CR8","doi-asserted-by":"publisher","first-page":"7530","DOI":"10.1109\/TCSVT.2023.3275382","volume":"33","author":"X Li","year":"2023","unstructured":"Li, X., Song, Q., Wu, J., Zhu, R., Ma, Z., Xue, J.H.: Locally-enriched cross-reconstruction for few-shot fine-grained image classification. IEEE Trans. Circ. Syst. Video Technol. 33(12), 7530\u20137540 (2023)","journal-title":"IEEE Trans. Circ. Syst. Video Technol."},{"key":"3650_CR9","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.121436","volume":"237","author":"J Zhang","year":"2024","unstructured":"Zhang, J., Slamu, W.: Partial channel pooling attention beats convolutional attention. Expert Syst. Appl. 237, 121436 (2024)","journal-title":"Expert Syst. Appl."},{"issue":"3","key":"3650_CR10","doi-asserted-by":"publisher","DOI":"10.1007\/s11432-021-3493-7","volume":"66","author":"G Cheng","year":"2023","unstructured":"Cheng, G., Lai, P.J., Gao, D.H., Han, J.W.: Class attention network for image recognition. Sci. China Inf. Sci. 66(3), 132105 (2023)","journal-title":"Sci. China Inf. Sci."},{"key":"3650_CR11","doi-asserted-by":"crossref","unstructured":"Lee, K., Maji, S., Ravichandran, A., Soatto, S.: Meta-learning with differentiable convex optimization. In: Proceedings of the IEEE\/CVF Conference on Computer vision and Pattern Recognition, pp. 10657\u201310665 (2019)","DOI":"10.1109\/CVPR.2019.01091"},{"key":"3650_CR12","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2023.107296","volume":"127","author":"JF Jia","year":"2024","unstructured":"Jia, J.F., Feng, X., Yu, H.Q.: Few-shot classification via efficient meta-learning with hybrid optimization. Eng. Appl. Artif. Intell. 127, 107296 (2024)","journal-title":"Eng. Appl. Artif. Intell."},{"key":"3650_CR13","unstructured":"Finn, C., Abbeel, P., Levine, S.: Model-agnostic meta-learning for fast adaptation of deep networks. In: International Conference on Machine Learning, pp. 1126\u20131135. PMLR (2017)"},{"key":"3650_CR14","doi-asserted-by":"crossref","unstructured":"Osahor, U.M., Nasrabadi, N.M.: Ortho-shot: low displacement rank regularization with data augmentation for few-shot learning. In: CVF Winter Conference on Applications of Computer Vision (WACV), pp. 2040\u20132049 (2021)","DOI":"10.1109\/WACV51458.2022.00210"},{"key":"3650_CR15","first-page":"1","volume":"60","author":"MG Gong","year":"2022","unstructured":"Gong, M.G., Li, J.Z., Zhang, Y.R., Wu, Y., Zhang, M.Y.: Two-path aggregation attention network with quad-patch data augmentation for few-shot scene classification. IEEE Trans. Geosci. Remote Sens. 60, 1\u201316 (2022)","journal-title":"IEEE Trans. Geosci. Remote Sens."},{"key":"3650_CR16","doi-asserted-by":"crossref","unstructured":"Zhang, Y.R., Gong, M.G., Li, J.Z., Feng, K.Y., Zhang, M.Y.: Few-shot learning with enhancements to data augmentation and feature extraction. IEEE Trans. Neural Netw. Learn. Syst. (2024)","DOI":"10.1109\/TNNLS.2024.3400592"},{"key":"3650_CR17","doi-asserted-by":"crossref","unstructured":"Wang, X.X., Wang, X., Jiang, B., Luo, B.: Few-shot learning meets transformer: unified query-support transformers for few-shot classification. IEEE Trans. Circ. Syst. Video Technol. (2023)","DOI":"10.1109\/TCSVT.2023.3282777"},{"key":"3650_CR18","doi-asserted-by":"crossref","unstructured":"Zhang, C., Cai, Y.J., Lin, G.S., Shen, C.H.: Deepemd: few-shot image classification with differentiable earth mover's distance and structured classifiers. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 12203\u201312213 (2020)","DOI":"10.1109\/CVPR42600.2020.01222"},{"key":"3650_CR19","doi-asserted-by":"crossref","unstructured":"Li, W., Wang, L., Xu, J., Huo, J., Gao, Y., Luo, J.: Revisiting local descriptor based image-to-class measure for few-shot learning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7260\u20137268 (2019)","DOI":"10.1109\/CVPR.2019.00743"},{"key":"3650_CR20","unstructured":"Snell, Jake, Swersky, K., Zemel, R.: Prototypical networks for few-shot learning. Adv. Neural Inf. Process. Syst. 30 (2017)."},{"key":"3650_CR21","doi-asserted-by":"crossref","unstructured":"Kang, D., Kwon, H., Min, J.H., Cho, M.S.: Relational embedding for few-shot classification. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 8822\u20138833 2021","DOI":"10.1109\/ICCV48922.2021.00870"},{"issue":"3","key":"3650_CR22","doi-asserted-by":"publisher","first-page":"1091","DOI":"10.1109\/TCSVT.2020.2995754","volume":"31","author":"W Jiang","year":"2020","unstructured":"Jiang, W., Huang, K., Geng, J., Deng, X.Y.: Multi-scale metric learning for few-shot learning. IEEE Trans. Circ. Syst. Video Technol. 31(3), 1091\u20131102 (2020)","journal-title":"IEEE Trans. Circ. Syst. Video Technol."},{"key":"3650_CR23","doi-asserted-by":"publisher","first-page":"50","DOI":"10.1109\/TMM.2021.3120873","volume":"25","author":"X Lin","year":"2023","unstructured":"Lin, X., Sun, S., Huang, W., Sheng, B., Li, P., Feng, D.D.: EAPT: efficient attention pyramid transformer for image processing. IEEE Trans. Multimedia 25, 50\u201361 (2023)","journal-title":"IEEE Trans. Multimedia"},{"issue":"2","key":"3650_CR24","first-page":"1931","volume":"37","author":"WJ Moon","year":"2023","unstructured":"Moon, W.J., Seong, H.S., Heo, J.P.: Minority-oriented vicinity expansion with attentive aggregation for video long-tailed recognition. Proc. AAAI Conf. AI 37(2), 1931\u20131939 (2023)","journal-title":"Proc. AAAI Conf. AI"},{"key":"3650_CR25","doi-asserted-by":"crossref","unstructured":"Shim, S.H., Hyun, S., Bae, D.H., Heo, J.P.: Local attention pyramid for scene image generation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 7774\u20137782 (2022)","DOI":"10.1109\/CVPR52688.2022.00762"},{"key":"3650_CR26","unstructured":"Ramachandran, P., Parmar, N., Vaswani, A., Bello, I., Levskaya, A., Shlens, J.: Stand-alone self-attention in vision models. Adv. Neural Inf. Process. Syst. 32 (2019)"},{"key":"3650_CR27","doi-asserted-by":"publisher","first-page":"1903","DOI":"10.1109\/JSTARS.2023.3341338","volume":"17","author":"SX Xia","year":"2023","unstructured":"Xia, S.X., Zhang, X.H., Meng, H.Y., Fan, J.X., Jiao, L.C.: Two-stream networks for contrastive learning in hyperspectral image classification. IEEE J. Sel. Top. Appl. Earth Observ. Remote Sens. 17, 1903\u20131920 (2023)","journal-title":"IEEE J. Sel. Top. Appl. Earth Observ. Remote Sens."},{"key":"3650_CR28","doi-asserted-by":"crossref","unstructured":"Hu, J., Shen, L., Sun, G.: Squeeze-and-excitation networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 7132\u20137141 (2018)","DOI":"10.1109\/CVPR.2018.00745"},{"key":"3650_CR29","doi-asserted-by":"crossref","unstructured":"Woo, S., Park, J., Lee, J.Y., Kweon, I.S.: Cbam: convolutional block attention module. In Proceedings of the European conference on computer vision (ECCV), pp. 3\u201319 (2018)","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"3650_CR30","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., Weissenborn, D., Zhai, X.H., Unterthiner, T., Dehghani, M. et al.: An image is worth 16\u2009\u00d7\u200916 words: Transformers for image recognition at scale. (2020)"},{"key":"3650_CR31","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Aruni, R.C., Maji, S.: Bilinear CNN models for fine-grained visual recognition. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1449\u20131457 (2015)","DOI":"10.1109\/ICCV.2015.170"},{"key":"3650_CR32","doi-asserted-by":"crossref","unstructured":"Kong, S., Fowlkes, S.: Low-rank bilinear pooling for fine-grained classification. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 365\u2013374 (2017)","DOI":"10.1109\/CVPR.2017.743"},{"key":"3650_CR33","doi-asserted-by":"crossref","unstructured":"Gao, Y., Beijbom, O., Zhang, N., Darrell, T.: Compact bilinear pooling. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 317\u2013326 (2016)","DOI":"10.1109\/CVPR.2016.41"},{"key":"3650_CR34","doi-asserted-by":"crossref","unstructured":"Yu, C.J., Zhao, X.Y., Zheng, Q., Zhang, P., You, X.G.: Hierarchical bilinear pooling for fine-grained visual recognition. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 574\u2013589 (2018)","DOI":"10.1007\/978-3-030-01270-0_35"},{"issue":"3","key":"3650_CR35","first-page":"3554","volume":"45","author":"Y Song","year":"2022","unstructured":"Song, Y., Sebe, N., Wang, W.: On the eigenvalues of global covariance pooling for fine-grained visual recognition. IEEE Trans. Pattern Anal. Mach. Intell. 45(3), 3554\u20133566 (2022)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"12","key":"3650_CR36","doi-asserted-by":"publisher","first-page":"6116","DOI":"10.1109\/TIP.2019.2924811","volume":"28","author":"XS Wei","year":"2019","unstructured":"Wei, X.S., Wang, P., Liu, L.Q., Shen, C.H., Wu, J.X.: Piecewise classifier mappings: learning fine-grained learners for novel categories with few examples. IEEE Trans. Image Process. 28(12), 6116\u20136125 (2019)","journal-title":"IEEE Trans. Image Process."},{"key":"3650_CR37","doi-asserted-by":"publisher","first-page":"1666","DOI":"10.1109\/TMM.2020.3001510","volume":"23","author":"HX Huang","year":"2020","unstructured":"Huang, H.X., Zhang, J.J., Zhang, J., Xu, J.S., Wu, Q.: Low-rank pairwise alignment bilinear network for few-shot fine-grained image classification. IEEE Trans. Multimedia 23, 1666\u20131680 (2020)","journal-title":"IEEE Trans. Multimedia"},{"key":"3650_CR38","unstructured":"Wah, C., Branson, S., Welinder, P., Perona, P., Belongie, S.: The caltech-ucsd birds-200\u20132011 dataset. (2011)."},{"key":"3650_CR39","unstructured":"Chen, W.Y., Liu, Y.C., Kira, Z., Wang, Y.C.F., Huang, J.B.: A closer look at few-shot classification. (2019)"},{"key":"3650_CR40","doi-asserted-by":"crossref","unstructured":"Ye, H.J., Hu, H.X., Zhan, D.C., Sha, F.: Few-shot learning via embedding adaptation with set-to-set functions. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 8808\u20138817 (2020)","DOI":"10.1109\/CVPR42600.2020.00883"},{"key":"3650_CR41","unstructured":"Khosla, A., Jayadevaprakash, N., Yao, B.P., Li, F.F.: Novel dataset for fine-grained image categorization: Stanford dogs. In: Proc. CVPR Workshop on Fine-Grained Visual Categorization (FGVC), vol. 2, no. 1. Citeseer, (2011)"},{"issue":"3","key":"3650_CR42","first-page":"2821","volume":"37","author":"JJ Wu","year":"2023","unstructured":"Wu, J.J., Chang, D.L., Sain, A., Li, X.X., Ma, Z.Y., Cao, J., Guo, J., Song, Y.Z.: Bi-directional feature reconstruction network for fine-grained few-shot image classification. Proc. AAAI Conf. AI 37(3), 2821\u20132829 (2023)","journal-title":"Proc. AAAI Conf. AI"},{"key":"3650_CR43","doi-asserted-by":"crossref","unstructured":"Zhu, Y.H., Liu, C.L., Jiang, S.Q.: Multi-attention meta learning for few-shot fine-grained image recognition. In: IJCAI, pp. 1090\u20131096 (2020)","DOI":"10.24963\/ijcai.2020\/152"},{"key":"3650_CR44","doi-asserted-by":"crossref","unstructured":"Krause, J., Stark, M., Deng, J., Li, F.F.: 3d object representations for fine-grained categorization. In: Proceedings of the IEEE International Conference on Computer Vision Workshops, pp. 554\u2013561 (2013)","DOI":"10.1109\/ICCVW.2013.77"},{"key":"3650_CR45","doi-asserted-by":"crossref","unstructured":"Zhang, H.G., Koniusz, P.: Power normalizing second-order similarity network for few-shot learning. In: 2019 IEEE Winter Conference on Applications of Computer Vision (WACV), pp. 1185\u20131193. IEEE (2019)","DOI":"10.1109\/WACV.2019.00131"},{"key":"3650_CR46","doi-asserted-by":"publisher","first-page":"16","DOI":"10.1016\/j.neucom.2021.09.016","volume":"466","author":"CF Wang","year":"2021","unstructured":"Wang, C.F., Song, S.J., Yang, Q.S., Li, X., Huang, G.: Fine-grained few shot learning with foreground object transformation. Neurocomputing 466, 16\u201326 (2021)","journal-title":"Neurocomputing"},{"key":"3650_CR47","doi-asserted-by":"crossref","unstructured":"Lee, S.B., Moon, W.J., Heo, J.P.: Task discrepancy maximization for fine-grained few-shot classification. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 5331\u20135340 (2022)","DOI":"10.1109\/CVPR52688.2022.00526"},{"issue":"8","key":"3650_CR48","doi-asserted-by":"publisher","first-page":"3947","DOI":"10.1109\/TCSVT.2023.3236636","volume":"33","author":"ZC Zha","year":"2023","unstructured":"Zha, Z.C., Tang, H., Sun, Y.L., Tang, J.H.: Boosting few-shot fine-grained recognition with background suppression and foreground alignment. IEEE Trans. Circ. Syst. Video Technol. 33(8), 3947\u20133961 (2023)","journal-title":"IEEE Trans. Circ. Syst. Video Technol."},{"key":"3650_CR49","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2022.108792","volume":"130","author":"H Tang","year":"2022","unstructured":"Tang, H., Yuan, C.C., Li, Z.C., Tang, J.H.: Learning attention-guided pyramidal features for few-shot fine-grained recognition. Pattern Recogn. 130, 108792 (2022)","journal-title":"Pattern Recogn."},{"issue":"2","key":"3650_CR50","doi-asserted-by":"publisher","first-page":"853","DOI":"10.1109\/TCSVT.2021.3065693","volume":"32","author":"HX Huang","year":"2021","unstructured":"Huang, H.X., Zhang, J.J., Yu, L.T., Zhang, J., Wu, Q., Xu, C.: TOAN: target-oriented alignment network for fine-grained image categorization with few labeled samples. IEEE Trans. Circ. Syst. Video Technol. 32(2), 853\u2013866 (2021)","journal-title":"IEEE Trans. Circ. Syst. Video Technol."},{"key":"3650_CR51","doi-asserted-by":"publisher","first-page":"1318","DOI":"10.1109\/TIP.2020.3043128","volume":"30","author":"XX Li","year":"2020","unstructured":"Li, X.X., Wu, J.J., Sun, Z., Ma, Z.Y., Cao, J., Xue, J.H.: BSNet: Bi-similarity network for few-shot fine-grained image classification. IEEE Trans. Image Process. 30, 1318\u20131331 (2020)","journal-title":"IEEE Trans. Image Process."}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-024-03650-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00371-024-03650-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-024-03650-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,16]],"date-time":"2025-04-16T06:21:01Z","timestamp":1744784461000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00371-024-03650-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9,26]]},"references-count":51,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2025,4]]}},"alternative-id":["3650"],"URL":"https:\/\/doi.org\/10.1007\/s00371-024-03650-6","relation":{"has-preprint":[{"id-type":"doi","id":"10.21203\/rs.3.rs-4661763\/v1","asserted-by":"object"}]},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"value":"0178-2789","type":"print"},{"value":"1432-2315","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,9,26]]},"assertion":[{"value":"7 September 2024","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 September 2024","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}