{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T18:47:28Z","timestamp":1775069248526,"version":"3.50.1"},"reference-count":93,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2024,7,30]],"date-time":"2024-07-30T00:00:00Z","timestamp":1722297600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,7,30]],"date-time":"2024-07-30T00:00:00Z","timestamp":1722297600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Comput Vis"],"published-print":{"date-parts":[[2025,1]]},"DOI":"10.1007\/s11263-024-02189-2","type":"journal-article","created":{"date-parts":[[2024,7,30]],"date-time":"2024-07-30T18:32:12Z","timestamp":1722364332000},"page":"372-397","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Equiangular Basis Vectors: A Novel Paradigm for Classification Tasks"],"prefix":"10.1007","volume":"133","author":[{"given":"Yang","family":"Shen","sequence":"first","affiliation":[]},{"given":"Xuhao","family":"Sun","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8200-1845","authenticated-orcid":false,"given":"Xiu-Shen","family":"Wei","sequence":"additional","affiliation":[]},{"given":"Anqi","family":"Xu","sequence":"additional","affiliation":[]},{"given":"Lingyan","family":"Gao","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,7,30]]},"reference":[{"key":"2189_CR1","unstructured":"Bao, H., Dong, L., Piao, S., & Wei, F. (2021). Beit: Bert pre-training of image transformers. arXiv preprint arXiv:2106.08254"},{"key":"2189_CR2","unstructured":"Bellet, A., Habrard, A., & Sebban, M. (2013). A survey on metric learning for feature vectors and structured data. arXiv preprint arXiv:1306.6709"},{"key":"2189_CR3","unstructured":"Cao, K., Wei, C., Gaidon, A., Arechiga, N., & Ma, T. (2019). Learning imbalanced datasets with label-distribution-aware margin loss. Advances in Neural Information Processing Systems, pp. 1567\u20131578"},{"key":"2189_CR4","doi-asserted-by":"crossref","unstructured":"Caron, M., Touvron, H., Misra, I., J\u00e9gou, H., Mairal, J., Bojanowski, P., & Joulin, A. (2021). Emerging properties in self-supervised vision transformers. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 9650\u20139660","DOI":"10.1109\/ICCV48922.2021.00951"},{"issue":"5","key":"2189_CR5","doi-asserted-by":"publisher","first-page":"1055","DOI":"10.1109\/72.788646","volume":"10","author":"O Chapelle","year":"1999","unstructured":"Chapelle, O., Haffner, P., & Vapnik, V. N. (1999). Support vector machines for histogram-based image classification. IEEE Transactions on Neural Networks, 10(5), 1055\u20131064.","journal-title":"IEEE Transactions on Neural Networks"},{"key":"2189_CR6","unstructured":"Chen, T., Kornblith, S., Norouzi, M., & Hinton, G. (2020). A simple framework for contrastive learning of visual representations. In International Conference on Machine Learning, pp. 1597\u20131607"},{"key":"2189_CR7","unstructured":"Chen, K., Wang, J., Pang, J., Cao, Y., Xiong, Y., Li, X., Sun, S., Feng, W., Liu, Z., Xu, J., Zhang, Z., Cheng, D., Zhu, C., Cheng, T., Zhao, Q., Li, B., Lu, X., Zhu, R., Wu, Y., Dai, J., Wang, J., Shi, J., Ouyang, W., Loy, C.C., & Lin, D. (2019). MMDetection: Open MMLab detection toolbox and benchmark. arXiv preprint arXiv:1906.07155"},{"key":"2189_CR8","doi-asserted-by":"crossref","unstructured":"Cimpoi, M., Maji, S., Kokkinos, I., Mohamed, S., & Vedaldi, A. (2014). Describing textures in the wild. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 3606\u20133613","DOI":"10.1109\/CVPR.2014.461"},{"key":"2189_CR9","unstructured":"Contributors, M. (2020). MMSegmentation: Open MMLab semantic segmentation toolbox and benchmark. Available online: https:\/\/github.com\/open-mmlab\/mmsegmentation (Retrieved on 18 May 2022)"},{"key":"2189_CR10","first-page":"795","volume":"13","author":"C Cortes","year":"2012","unstructured":"Cortes, C., Mohri, M., & Rostamizadeh, A. (2012). Algorithms for learning kernels based on centered alignment. Journal of Machine Learning Research, 13, 795\u2013828.","journal-title":"Journal of Machine Learning Research"},{"issue":"1","key":"2189_CR11","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1007\/s10479-005-5724-z","volume":"134","author":"PT De Boer","year":"2005","unstructured":"De Boer, P. T., Kroese, D. P., Mannor, S., & Rubinstein, R. Y. (2005). A tutorial on the cross-entropy method. Annals of Operations Research, 134(1), 19\u201367.","journal-title":"Annals of Operations Research"},{"key":"2189_CR12","doi-asserted-by":"crossref","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.J., Li, K., & Fei-Fei, L. (2009). ImageNet: A large-scale hierarchical image database. In IEEE conference on computer vision and pattern recognition, pp. 248\u2013255","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"2189_CR13","doi-asserted-by":"crossref","unstructured":"Deng, J., Guo, J., Xue, N., & Zafeiriou, S. (2019). Arcface: Additive angular margin loss for deep face recognition. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 4690\u20134699","DOI":"10.1109\/CVPR.2019.00482"},{"key":"2189_CR14","unstructured":"Dosovitskiy, A., Beyer, L., Kolesnikov, A., Weissenborn, D., Zhai, X., Unterthiner, T., Dehghani, M., Minderer, M., Heigold, G., Gelly, S., Uszkoreit, J., & Houlsby, N. (2020). An image is worth 16x16 words: Transformers for image recognition at scale. arXiv preprint arXiv:2010.11929"},{"key":"2189_CR15","doi-asserted-by":"crossref","unstructured":"Elad, M. (2010). Sparse and redundant representations: from theory to applications in signal and image processing, vol.\u00a02. Springer","DOI":"10.1007\/978-1-4419-7011-4"},{"key":"2189_CR16","unstructured":"Ericson, T., & Zinoviev, V. (2001). Codes on Euclidean spheres. Elsevier"},{"key":"2189_CR17","doi-asserted-by":"publisher","first-page":"810","DOI":"10.1016\/j.aim.2018.03.024","volume":"330","author":"A Glazyrin","year":"2018","unstructured":"Glazyrin, A., & Yu, W. H. (2018). Upper bounds for s-distance sets and equiangular lines. Advances in Mathematics, 330, 810\u2013833.","journal-title":"Advances in Mathematics"},{"key":"2189_CR18","unstructured":"Gretton, A., Fukumizu, K., Teo, C., Song, L., Sch\u00f6lkopf, B., & Smola, A. (2007). A kernel statistical test of independence. Advances in neural information processing systems, pp. 585\u2013592"},{"key":"2189_CR19","doi-asserted-by":"crossref","unstructured":"Guo, Y., Wang, X., Chen, Y., & Yu, S.X. (2022). Clipped hyperbolic classifiers are super-hyperbolic classifiers. In Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 11\u201320","DOI":"10.1109\/CVPR52688.2022.00010"},{"key":"2189_CR20","doi-asserted-by":"crossref","unstructured":"He, K., Chen, X., Xie, S., Li, Y., Doll\u00e1r, P., & Girshick, R. (2022). Masked autoencoders are scalable vision learners. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 16000\u201316009","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"2189_CR21","doi-asserted-by":"crossref","unstructured":"He, K., Gkioxari, G., Doll\u00e1r, P., & Girshick, R. (2017). Mask R-CNN. In IEEE international conference on computer vision, pp. 2961\u20132969","DOI":"10.1109\/ICCV.2017.322"},{"key":"2189_CR22","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., & Sun, J. (2016). Deep residual learning for image recognition. In Proceedings of the IEEE conference on computer vision and pattern recognition, pp. 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"2189_CR23","unstructured":"Hinton, G., Vinyals, O., & Dean, J. (2015). Distilling the knowledge in a neural network. arXiv preprint arXiv:1503.02531"},{"key":"2189_CR24","doi-asserted-by":"crossref","unstructured":"Hu, G., Xu, Z., Wang, G., Zeng, B., Liu, Y., & Lei, Y. (2021). Forecasting energy consumption of long-distance oil products pipeline based on improved fruit fly optimization algorithm and support vector regression. Energy, 224, 120153.","DOI":"10.1016\/j.energy.2021.120153"},{"issue":"3","key":"2189_CR25","doi-asserted-by":"publisher","first-page":"729","DOI":"10.4007\/annals.2021.194.3.3","volume":"194","author":"Z Jiang","year":"2021","unstructured":"Jiang, Z., Tidor, J., Yao, Y., Zhang, S., & Zhao, Y. (2021). Equiangular lines with a fixed angle. Annals of Mathematics, 194(3), 729\u2013743.","journal-title":"Annals of Mathematics"},{"issue":"2","key":"2189_CR26","first-page":"355","volume":"22","author":"H Johannes","year":"1948","unstructured":"Johannes, H. (1948). Equilateral point-sets in elliptic two- and three-dimensional spaces. Nieuw Arch. Wiskunde, 22(2), 355\u2013362.","journal-title":"Nieuw Arch. Wiskunde"},{"issue":"9","key":"2189_CR27","first-page":"1066","volume":"11","author":"M Kaya","year":"2019","unstructured":"Kaya, M., & Bilge, H. \u015e. (2019). Symmetry. Deep metric learning: A survey, 11(9), 1066.","journal-title":"Deep metric learning: A survey"},{"key":"2189_CR28","unstructured":"Kingma, D.P., & Ba, J. (2014). Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980"},{"key":"2189_CR29","doi-asserted-by":"crossref","unstructured":"Kirillov, A., Girshick, R., He, K., & Doll\u00e1r, P. (2019). Panoptic feature pyramid networks. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 6399\u20136408","DOI":"10.1109\/CVPR.2019.00656"},{"key":"2189_CR30","doi-asserted-by":"crossref","unstructured":"Kolesnikov, A., Beyer, L., Zhai, X., Puigcerver, J., Yung, J., Gelly, S., & Houlsby, N. (2020). Big Transfer (BiT): General visual representation learning. In European Conference Computer Vision pp. 491\u2013507. Springer","DOI":"10.1007\/978-3-030-58558-7_29"},{"key":"2189_CR31","unstructured":"Kornblith, S., Norouzi, M., Lee, H., & Hinton, G. (2019). Similarity of neural network representations revisited. In International conference on machine learning, pp. 3519\u20133529"},{"issue":"6","key":"2189_CR32","doi-asserted-by":"publisher","first-page":"84","DOI":"10.1145\/3065386","volume":"60","author":"A Krizhevsky","year":"2017","unstructured":"Krizhevsky, A., Sutskever, I., & Hinton, G. E. (2017). ImageNet classification with deep convolutional neural networks. Communications of the ACM, 60(6), 84\u201390.","journal-title":"Communications of the ACM"},{"issue":"11","key":"2189_CR33","doi-asserted-by":"publisher","first-page":"2278","DOI":"10.1109\/5.726791","volume":"86","author":"Y LeCun","year":"1998","unstructured":"LeCun, Y., Bottou, L., Bengio, Y., & Haffner, P. (1998). Gradient-based learning applied to document recognition. Proceedings of the IEEE, 86(11), 2278\u20132324.","journal-title":"Proceedings of the IEEE"},{"key":"2189_CR34","doi-asserted-by":"crossref","unstructured":"Lin, T.Y., Maire, M., Belongie, S., Hays, J., Perona, P., Ramanan, D., Doll\u00e1r, P., & Zitnick, C.L. (2014). Microsoft COCO: Common objects in context. In European Conference Computer Vision., pp. 740\u2013755","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"2189_CR35","doi-asserted-by":"crossref","unstructured":"Liu, Z., Hu, H., Lin, Y., Yao, Z., Xie, Z., Wei, Y., Ning, J., Cao, Y., Zhang, Z., Dong, L., et\u00a0al. (2022). Swin transformer v2: Scaling up capacity and resolution. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 12009\u201312019","DOI":"10.1109\/CVPR52688.2022.01170"},{"key":"2189_CR36","doi-asserted-by":"crossref","unstructured":"Liu, Z., Lin, Y., Cao, Y., Hu, H., Wei, Y., Zhang, Z., Lin, S., & Guo, B. (2021). Swin transformer: Hierarchical vision transformer using shifted windows. In: International Conference on Computer Vision, pp. 10012\u201310022","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"2189_CR37","doi-asserted-by":"crossref","unstructured":"Liu, Z., Mao, H., Wu, C.Y., Feichtenhofer, C., Darrell, T., & Xie, S. (2022). A ConvNet for the 2020s. In Proceedings of the IEEE\/CVF conference on computer vision and pattern recognition, pp. 11976\u201311986","DOI":"10.1109\/CVPR52688.2022.01167"},{"key":"2189_CR38","first-page":"21464","volume":"33","author":"W Liu","year":"2020","unstructured":"Liu, W., Wang, X., Owens, J., & Li, Y. (2020). Energy-based out-of-distribution detection. Adv. Neural Inform. Process. Syst., 33, 21464\u201321475.","journal-title":"Adv. Neural Inform. Process. Syst."},{"key":"2189_CR39","unstructured":"Loshchilov, I., & Hutter, F. (2017). Decoupled weight decay regularization. arXiv preprint arXiv:1711.05101"},{"issue":"5","key":"2189_CR40","doi-asserted-by":"publisher","first-page":"823","DOI":"10.1080\/01431160600746456","volume":"28","author":"D Lu","year":"2007","unstructured":"Lu, D., & Weng, Q. (2007). A survey of image classification methods and techniques for improving classification performance. International Journal of Remote Sensing, 28(5), 823\u2013870.","journal-title":"International Journal of Remote Sensing"},{"key":"2189_CR41","unstructured":"Maji, S., Rahtu, E., Kannala, J., Blaschko, M., & Vedaldi, A. (2013). Fine-grained visual classification of aircraft. arXiv preprint arXiv:1306.5151"},{"issue":"9","key":"2189_CR42","doi-asserted-by":"publisher","first-page":"2784","DOI":"10.1080\/01431161.2018.1433343","volume":"39","author":"AE Maxwell","year":"2018","unstructured":"Maxwell, A. E., Warner, T. A., & Fang, F. (2018). Implementation of machine-learning classification in remote sensing: An applied review. International Journal of Remote Sensing, 39(9), 2784\u20132817.","journal-title":"International Journal of Remote Sensing"},{"key":"2189_CR43","unstructured":"McCallum, A., Freitag, D., & Pereira, F.C. (2000). Maximum entropy markov models for information extraction and segmentation. In: International Conference on Machine Learning., pp. 591\u2013598"},{"issue":"11","key":"2189_CR44","doi-asserted-by":"publisher","first-page":"2624","DOI":"10.1109\/TPAMI.2013.83","volume":"35","author":"T Mensink","year":"2013","unstructured":"Mensink, T., Verbeek, J., Perronnin, F., & Csurka, G. (2013). Distance-based image classification: Generalizing to new classes at near-zero cost. IEEE Transactions on Pattern Analysis and Machine Intelligence, 35(11), 2624\u20132637.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2189_CR45","unstructured":"Mettes, P., Van\u00a0der Pol, E., & Snoek, C. (2019). Hyperspherical prototype networks. Advances in neural information processing systems"},{"key":"2189_CR46","doi-asserted-by":"crossref","unstructured":"M\u00fcller, S.G., & Hutter, F. (2021). Trivialaugment: Tuning-free yet state-of-the-art data augmentation. In Proceedings of the IEEE\/CVF international conference on computer vision, pp. 774\u2013782","DOI":"10.1109\/ICCV48922.2021.00081"},{"key":"2189_CR47","unstructured":"Netzer, Y., Wang, T., Coates, A., Bissacco, A., Wu, B., & Ng, A.Y. (2011). Reading digits in natural images with unsupervised feature learning. Adv. Neural Inform. Process. Syst. Worksh., pp. 1\u20139"},{"key":"2189_CR48","doi-asserted-by":"crossref","unstructured":"Pernici, F., Bruni, M., Baecchi, C., & Del\u00a0Bimbo, A. (2021). Regular polytope networks. Adv. Neural Inform. Process. Syst., pp. 4373\u20134387","DOI":"10.1109\/TNNLS.2021.3056762"},{"key":"2189_CR49","unstructured":"Ranjan, R., Castillo, C.D., & Chellappa, R. (2017). L2-constrained softmax loss for discriminative face verification. arXiv preprint arXiv:1703.09507"},{"key":"2189_CR50","doi-asserted-by":"crossref","unstructured":"Rao, H., Leung, C., & Miao, C. (2023). Hierarchical skeleton meta-prototype contrastive learning with hard skeleton mining for unsupervised person re-identification. Int. J. Comput. Vis. pp. 1\u201323","DOI":"10.1007\/s11263-023-01864-0"},{"issue":"9","key":"2189_CR51","doi-asserted-by":"publisher","first-page":"2352","DOI":"10.1162\/neco_a_00990","volume":"29","author":"W Rawat","year":"2017","unstructured":"Rawat, W., & Wang, Z. (2017). Deep convolutional neural networks for image classification: A comprehensive review. Neural Computation, 29(9), 2352\u20132449.","journal-title":"Neural Computation"},{"issue":"6","key":"2189_CR52","doi-asserted-by":"publisher","first-page":"2171","DOI":"10.1063\/1.1737053","volume":"45","author":"JM Renes","year":"2004","unstructured":"Renes, J. M., Blume-Kohout, R., Scott, A. J., & Caves, C. M. (2004). Symmetric informationally complete quantum measurements. Journal of Mathematical Physics, 45(6), 2171\u20132180.","journal-title":"Journal of Mathematical Physics"},{"key":"2189_CR53","doi-asserted-by":"crossref","unstructured":"Robbins, H., & Monro, S. (1951). A stochastic approximation method. The Annals of Mathematical Statistics pp. 400\u2013407","DOI":"10.1214\/aoms\/1177729586"},{"key":"2189_CR54","unstructured":"Rudin, W. (1953). Principles of mathematical analysis"},{"issue":"3","key":"2189_CR55","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky, O., Deng, J., Su, H., Krause, J., Satheesh, S., Ma, S., Huang, Z., Karpathy, A., Khosla, A., Bernstein, M., Berg, C. A., & Fei-Fei, L. (2015). ImageNet large scale visual recognition challenge. International Journal of Computer Vision, 115(3), 211\u2013252.","journal-title":"International Journal of Computer Vision"},{"key":"2189_CR56","doi-asserted-by":"crossref","unstructured":"Selvaraju, R.R., Cogswell, M., Das, A., Vedantam, R., Parikh, D., & Batra, D.(2017). Grad-CAM: Visual explanations from deep networks via gradient-based localization. International Journal of Computer Vision., pp. 618\u2013626","DOI":"10.1109\/ICCV.2017.74"},{"key":"2189_CR57","doi-asserted-by":"crossref","unstructured":"Shen, Y., Sun, X., & Wei, X.S. (2023). Equiangular basis vectors. arXiv preprint arXiv:2303.11637","DOI":"10.1109\/CVPR52729.2023.01131"},{"key":"2189_CR58","unstructured":"Snell, J., Swersky, K., & Zemel, R. (2017). Prototypical networks for few-shot learning. Advances in Neural Information Processing Systems, pp. 4080\u20134090"},{"issue":"3","key":"2189_CR59","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1016\/S1063-5203(03)00023-X","volume":"14","author":"T Strohmer","year":"2003","unstructured":"Strohmer, T., & Heath, R. W., Jr. (2003). Grassmannian frames with applications to coding and communication. Applied and Computational Harmonic Analysis, 14(3), 257\u2013275.","journal-title":"Applied and Computational Harmonic Analysis"},{"key":"2189_CR60","unstructured":"Szegedy, C., Toshev, A., & Erhan, D. (2013). Deep neural networks for object detection. Advances in Neural Information Processing Systems., pp. 2553\u20132561"},{"key":"2189_CR61","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Vanhoucke, V., Ioffe, S., Shlens, J., & Wojna, Z. (2016). Rethinking the inception architecture for computer vision. In The IEEE \/ CVF Computer Vision and Pattern Recognition Conference., pp. 2818\u20132826","DOI":"10.1109\/CVPR.2016.308"},{"issue":"1","key":"2189_CR62","first-page":"1","volume":"27","author":"PML Tammes","year":"1930","unstructured":"Tammes, P. M. L. (1930). On the origin of number and arrangement of the places of exit on the surface of pollen-grains. Recueil Des Travaux Botaniques N\u00e9erlandais, 27(1), 1\u201384.","journal-title":"Recueil Des Travaux Botaniques N\u00e9erlandais"},{"key":"2189_CR63","doi-asserted-by":"crossref","unstructured":"Tulyakov, S., Jaeger, S., Govindaraju, V., & Doermann, D. (2008). Review of classifier combination methods. Machine learning in document analysis and recognition. pp. 361\u2013386","DOI":"10.1007\/978-3-540-76280-5_14"},{"issue":"3","key":"2189_CR64","doi-asserted-by":"publisher","first-page":"335","DOI":"10.1016\/S1385-7258(66)50038-5","volume":"28","author":"JH van Lint","year":"1966","unstructured":"van Lint, J. H., & Seidel, J. J. (1966). Equilateral point sets in elliptic geometry. Indagationes Mathematicae, 28(3), 335\u2013348.","journal-title":"Indagationes Mathematicae"},{"key":"2189_CR65","unstructured":"Van\u00a0der Maaten, L., & Hinton, G. (2008). Visualizing data using t-SNE. Journal of Machine Learning Research9(11)"},{"key":"2189_CR66","doi-asserted-by":"crossref","unstructured":"Van\u00a0Horn, G., Mac\u00a0Aodha, O., Song, Y., Cui, Y., Sun, C., Shepard, A., Adam, H., Perona, P., & Belongie, S. (2018). The iNaturalist species classification and detection dataset. In: The IEEE \/ CVF Computer Vision and Pattern Recognition Conference, pp. 8769\u20138778","DOI":"10.1109\/CVPR.2018.00914"},{"key":"2189_CR67","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A.N., Kaiser, \u0141., & Polosukhin, I. (2017). Attention is all you need. Advances in Neural Information Processing Systems, pp. 6000\u20136010"},{"key":"2189_CR68","unstructured":"Vryniotis, V. (2021). How to train State-of-The-Art models using TorchVision\u2019s latest primitives. https:\/\/pytorch.org\/blog\/how-to-train-state-of-the-art-models-using-torchvision-latest-primitives\/"},{"key":"2189_CR69","unstructured":"Wah, C., Branson, S., Welinder, P., Perona, P., & Belongie, S. (2011). The Caltech-UCSD birds-200-2011 dataset. Tech. Report CNS-TR-2011-001"},{"key":"2189_CR70","doi-asserted-by":"crossref","unstructured":"Wang, J., Song, Y., Leung, T., Rosenberg, C., Wang, J., Philbin, J., Chen, B., & Wu, Y. (2014). Learning fine-grained image similarity with deep ranking. In The IEEE \/ CVF Computer Vision and Pattern Recognition Conference, pp. 1386\u20131393","DOI":"10.1109\/CVPR.2014.180"},{"key":"2189_CR71","doi-asserted-by":"crossref","unstructured":"Wang, H., Wang, Y., Zhou, Z., Ji, X., Gong, D., Zhou, J., Li, Z., & Liu, W. (2018). Cosface: Large margin cosine loss for deep face recognition. In: The IEEE \/ CVF Computer Vision and Pattern Recognition Conference, pp. 5265\u20135274","DOI":"10.1109\/CVPR.2018.00552"},{"key":"2189_CR72","doi-asserted-by":"crossref","unstructured":"Wang, F., Xiang, X., Cheng, J., & Yuille, A.L. (2017). Normface: L2 hypersphere embedding for face verification. In: ACM International Conference Multimedia, pp. 1041\u20131049","DOI":"10.1145\/3123266.3123359"},{"issue":"2","key":"2189_CR73","first-page":"207","volume":"10","author":"KQ Weinberger","year":"2009","unstructured":"Weinberger, K. Q., & Saul, L. K. (2009). Distance metric learning for large margin nearest neighbor classification. Journal of Machine Learning Research, 10(2), 207\u2013244.","journal-title":"Journal of Machine Learning Research"},{"issue":"12","key":"2189_CR74","doi-asserted-by":"publisher","first-page":"8927","DOI":"10.1109\/TPAMI.2021.3126648","volume":"44","author":"XS Wei","year":"2022","unstructured":"Wei, X. S., Song, Y. Z., Mac Aodha, O., Wu, J., Peng, Y., Tang, J., Yang, J., & Belongie, S. (2022). Fine-grained image analysis with deep learning: A survey. IEEE Transactions on Pattern Analysis and Machine Intelligence, 44(12), 8927\u20138948.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2189_CR75","doi-asserted-by":"crossref","unstructured":"Wen, Y., Zhang, K., Li, Z., & Qiao, Y. (2016). A discriminative feature learning approach for deep face recognition. In European Conference Computer Vision, pp. 499\u2013515","DOI":"10.1007\/978-3-319-46478-7_31"},{"key":"2189_CR76","unstructured":"Wightman, R., Touvron, H., & J\u00e9gou, H. (2021). ResNet strikes back: An improved training procedure in timm. arXiv preprint arXiv:2110.00476"},{"key":"2189_CR77","doi-asserted-by":"crossref","unstructured":"Wu, Z., Xiong, Y., Yu, S.X., & Lin, D. (2018). Unsupervised feature learning via non-parametric instance discrimination. In The IEEE \/ CVF Computer Vision and Pattern Recognition Conference, pp. 3733\u20133742","DOI":"10.1109\/CVPR.2018.00393"},{"key":"2189_CR78","doi-asserted-by":"crossref","unstructured":"Xiao, T., Liu, Y., Zhou, B., Jiang, Y., & Sun, J. (2018). Unified perceptual parsing for scene understanding. In European Conference Computer Vision., pp. 418\u2013434","DOI":"10.1007\/978-3-030-01228-1_26"},{"key":"2189_CR79","unstructured":"Xu, P., Ehinger, K.A., Zhang, Y., Finkelstein, A., Kulkarni, S.R., & Xiao, J. (2015). Turkergaze: Crowdsourcing saliency with webcam based eye tracking. arXiv preprint arXiv:1504.06755"},{"issue":"7","key":"2189_CR80","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1007\/s11263-022-01613-9","volume":"130","author":"W Xu","year":"2022","unstructured":"Xu, W., Xian, Y., Wang, J., Schiele, B., & Akata, Z. (2022). Attribute prototype network for any-shot learning. International Journal of Computer Vision, 130(7), 1735\u20131753.","journal-title":"International Journal of Computer Vision"},{"key":"2189_CR81","unstructured":"Yang, Y., Xie, L., Chen, S., Li, X., Lin, Z., & Tao, D. (2022). Do we really need a learnable classifier at the end of deep neural network? arXiv preprint arXiv:2203.09081"},{"issue":"11","key":"2189_CR82","doi-asserted-by":"publisher","first-page":"3878","DOI":"10.1109\/TPAMI.2020.2994749","volume":"43","author":"HJ Ye","year":"2022","unstructured":"Ye, H. J., Zhan, D. C., Jiang, Y., & Zhou, Z. H. (2022). Heterogeneous few-shot model rectification with semantic mapping. IEEE Transactions on Pattern Analysis and Machine Intelligence, 43(11), 3878\u20133891.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"2189_CR83","unstructured":"Yu, F., Seff, A., Zhang, Y., Song, S., Funkhouser, T., & Xiao, J. (2015). Lsun: Construction of a large-scale image dataset using deep learning with humans in the loop. arXiv preprint arXiv:1506.03365"},{"key":"2189_CR84","doi-asserted-by":"crossref","unstructured":"Yun, S., Han, D., Oh, S.J., Chun, S., Choe, J., & Yoo, Y. (2019). CutMix: Regularization strategy to train strong classifiers with localizable features. In International Conference on Computer Vision, pp. 6023\u20136032","DOI":"10.1109\/ICCV.2019.00612"},{"key":"2189_CR85","doi-asserted-by":"crossref","unstructured":"Zagoruyko, S., & Komodakis, N. (2016). Wide residual networks. arXiv preprint arXiv:1605.07146","DOI":"10.5244\/C.30.87"},{"key":"2189_CR86","doi-asserted-by":"crossref","unstructured":"Zhai, X., Kolesnikov, A., Houlsby, N., & Beyer, L. (2022). Scaling vision transformers. In The IEEE \/ CVF Computer Vision and Pattern Recognition Conference pp. 12104\u201312113","DOI":"10.1109\/CVPR52688.2022.01179"},{"key":"2189_CR87","unstructured":"Zhang, H., Cisse, M., Dauphin, Y.N., & Lopez-Paz, D. (2017). mixup: Beyond empirical risk minimization. arXiv preprint arXiv:1710.09412"},{"key":"2189_CR88","doi-asserted-by":"crossref","unstructured":"Zhong, Z., Zheng, L., Kang, G., Li, S., & Yang, Y. (2020). Random erasing data augmentation. In: AAAI, pp. 13001\u201313008","DOI":"10.1609\/aaai.v34i07.7000"},{"key":"2189_CR89","doi-asserted-by":"crossref","unstructured":"Zhou, Z. H. (2016). Learnware: On the future of machine learning. Frontiers of Computer Science,10(4), 589\u2013590.","DOI":"10.1007\/s11704-016-6906-3"},{"key":"2189_CR90","doi-asserted-by":"crossref","unstructured":"Zhou, B., Cui, Q., Wei, X.S., & Chen, Z.M. (2020). BBN: Bilateral-branch network with cumulative learning for long-tailed visual recognition. In The IEEE \/ CVF Computer Vision and Pattern Recognition Conference, pp. 9719\u20139728","DOI":"10.1109\/CVPR42600.2020.00974"},{"key":"2189_CR91","doi-asserted-by":"crossref","unstructured":"Zhou, B., Lapedriza, A., Khosla, A., Oliva, A., & Torralba, A. (2017). Places: A 10 million image database for scene recognition. IEEE Transactions on Pattern Analysis and Machine Intelligence,40(6), 1452\u20131464.","DOI":"10.1109\/TPAMI.2017.2723009"},{"key":"2189_CR92","doi-asserted-by":"crossref","unstructured":"Zhou, H.Y., Lu, C., Chen, C., Yang, S., & Yu, Y. (2023). A unified visual information preservation framework for self-supervised pre-training in medical image analysis. IEEE Transactions on Pattern Analysis and Machine Intelligence, 45(7), 8020\u20138035.","DOI":"10.1109\/TPAMI.2023.3234002"},{"key":"2189_CR93","doi-asserted-by":"crossref","unstructured":"Zhou, B., Zhao, H., Puig, X., Xiao, T., Fidler, S., Barriuso, A., & Torralba, A. (2019). Semantic understanding of scenes through the ADE20k dataset. International Journal of Computer Vision, 127(3), 302\u2013321.","DOI":"10.1007\/s11263-018-1140-0"}],"container-title":["International Journal of Computer Vision"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-024-02189-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11263-024-02189-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11263-024-02189-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,7]],"date-time":"2025-01-07T06:14:42Z","timestamp":1736230482000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11263-024-02189-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7,30]]},"references-count":93,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2025,1]]}},"alternative-id":["2189"],"URL":"https:\/\/doi.org\/10.1007\/s11263-024-02189-2","relation":{},"ISSN":["0920-5691","1573-1405"],"issn-type":[{"value":"0920-5691","type":"print"},{"value":"1573-1405","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,7,30]]},"assertion":[{"value":"19 October 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 July 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 July 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}