{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,24]],"date-time":"2026-03-24T01:06:23Z","timestamp":1774314383595,"version":"3.50.1"},"reference-count":48,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2025,1,13]],"date-time":"2025-01-13T00:00:00Z","timestamp":1736726400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,13]],"date-time":"2025-01-13T00:00:00Z","timestamp":1736726400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62477006"],"award-info":[{"award-number":["62477006"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2025,4]]},"DOI":"10.1007\/s10489-024-06173-8","type":"journal-article","created":{"date-parts":[[2025,1,13]],"date-time":"2025-01-13T08:47:50Z","timestamp":1736758070000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["From spatial to semantic: attribute-aware fashion similarity learning via iterative positioning and attribute diverging"],"prefix":"10.1007","volume":"55","author":[{"given":"Yongquan","family":"Wan","sequence":"first","affiliation":[]},{"given":"Jianfei","family":"Zheng","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0313-8833","authenticated-orcid":false,"given":"Cairong","family":"Yan","sequence":"additional","affiliation":[]},{"given":"Guobing","family":"Zou","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,1,13]]},"reference":[{"key":"6173_CR1","doi-asserted-by":"crossref","unstructured":"Ma J, Sun H, Yang D, Zhang H (2024) Personalized fashion recommendations for diverse body shapes and local preferences with contrastive multimodal cross-attention network. ACM Transactions on Intelligent Systems and Technology","DOI":"10.1145\/3637217"},{"issue":"1","key":"6173_CR2","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3531017","volume":"19","author":"L De Divitiis","year":"2023","unstructured":"De Divitiis L, Becattini F, Baecchi C, Del Bimbo A (2023) Disentangling features for fashion recommendation. ACM Trans Multimed Comput Commun Appl 19(1):1\u201321","journal-title":"ACM Trans Multimed Comput Commun Appl"},{"key":"6173_CR3","doi-asserted-by":"crossref","unstructured":"Ma Y, Ding Y, Yang X, Liao L, Wong WK, Chua T-S (2020) Knowledge enhanced neural fashion trend forecasting. In: Proceedings of the 2020 International Conference on Multimedia Retrieval, pp 82\u201390","DOI":"10.1145\/3372278.3390677"},{"key":"6173_CR4","doi-asserted-by":"crossref","unstructured":"Mall U, Matzen K, Hariharan B, Snavely N, Bala K (2019) Geostyle: Discovering fashion trends and events. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 411\u2013420","DOI":"10.1109\/ICCV.2019.00050"},{"key":"6173_CR5","doi-asserted-by":"crossref","unstructured":"Al-Halah Z, Stiefelhagen R, Grauman K (2017) Fashion forward: Forecasting visual style in fashion. In: Proceedings of the IEEE International Conference on Computer Vision, pp 388\u2013397","DOI":"10.1109\/ICCV.2017.50"},{"issue":"4","key":"6173_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3447239","volume":"54","author":"W-H Cheng","year":"2021","unstructured":"Cheng W-H, Song S, Chen C-Y, Hidayati SC, Liu J (2021) Fashion meets computer vision: A survey. ACM Comput Surv 54(4):1\u201341","journal-title":"ACM Comput Surv"},{"issue":"5","key":"6173_CR7","doi-asserted-by":"publisher","first-page":"2687","DOI":"10.1109\/TCSVT.2021.3080920","volume":"32","author":"SR Dubey","year":"2021","unstructured":"Dubey SR (2021) A decade survey of content based image retrieval using deep learning. IEEE Trans Circuits Syst Video Technol 32(5):2687\u20132704","journal-title":"IEEE Trans Circuits Syst Video Technol"},{"issue":"4","key":"6173_CR8","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3624733","volume":"56","author":"Y Deldjoo","year":"2023","unstructured":"Deldjoo Y, Nazary F, Ramisa A, Mcauley J, Pellegrini G, Bellogin A, Noia TD (2023) A review of modern fashion recommender systems. ACM Comput Surv 56(4):1\u201337","journal-title":"ACM Comput Surv"},{"key":"6173_CR9","doi-asserted-by":"crossref","unstructured":"Duan K, Parikh D, Crandall D, Grauman K (2012) Discovering localized attributes for fine-grained recognition. In: Proceedings of the 2012 IEEE Conference on Computer Vision and Pattern Recognition, pp 3474\u20133481. IEEE","DOI":"10.1109\/CVPR.2012.6248089"},{"key":"6173_CR10","doi-asserted-by":"crossref","unstructured":"Huynh D, Elhamifar E (2020) Fine-grained generalized zero-shot learning via dense attribute-based attention. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 4483\u20134493","DOI":"10.1109\/CVPR42600.2020.00454"},{"key":"6173_CR11","doi-asserted-by":"crossref","unstructured":"Seo Y, Shin K-s (2018) Image classification of fine-grained fashion image based on style using pre-trained convolutional neural network. In: Proceedings of the 3rd International Conference on Big Data Analysis, pp 387\u2013390. IEEE","DOI":"10.1109\/ICBDA.2018.8367713"},{"key":"6173_CR12","doi-asserted-by":"crossref","unstructured":"Veit A, Belongie S, Karaletsos T (2017) Conditional similarity networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 830\u2013838","DOI":"10.1109\/CVPR.2017.193"},{"key":"6173_CR13","unstructured":"Wan Y, Yan K, Yan C, Zhang B (2022) Learning attribute-guided fashion similarity with spatial and channel attention. J Exp Theor Artif Intell 1\u201317"},{"key":"6173_CR14","doi-asserted-by":"crossref","unstructured":"Yan C, Ding A, Zhang Y, Wang Z (2021) Learning fashion similarity based on hierarchical attribute embedding. In: Proceedings of the 8th International Conference on Data Science and Advanced Analytics, pp 1\u20138. IEEE","DOI":"10.1109\/DSAA53316.2021.9564236"},{"key":"6173_CR15","doi-asserted-by":"crossref","unstructured":"Yan C, Yan K, Zhang Y, Wan Y, Zhu D (2022) Attribute-guided fashion image retrieval by iterative similarity learning. In: Proceedings of the 2022 IEEE International Conference on Multimedia and Expo, pp 1\u20136. IEEE","DOI":"10.1109\/ICME52920.2022.9859953"},{"key":"6173_CR16","doi-asserted-by":"crossref","unstructured":"Ma Z, Dong J, Long Z, Zhang Y, He Y, Xue H, Ji S (2020) Fine-grained fashion similarity learning by attribute-specific embedding network. In: Proceedings of the AAAI Conference on Artificial Intelligence, pp 11741\u201311748","DOI":"10.1609\/aaai.v34i07.6845"},{"key":"6173_CR17","doi-asserted-by":"publisher","first-page":"8410","DOI":"10.1109\/TIP.2021.3115658","volume":"30","author":"J Dong","year":"2021","unstructured":"Dong J, Ma Z, Mao X, Yang X, He Y, Hong R, Ji S (2021) Fine-grained fashion similarity prediction by attribute-specific embedding learning. IEEE Trans Image Process 30:8410\u20138425","journal-title":"IEEE Trans Image Process"},{"key":"6173_CR18","doi-asserted-by":"crossref","unstructured":"Dong J, Peng X, Ma Z, Liu D, Qu X, Yang X, Zhu J, Liu B (2023) From region to patch: Attribute-aware foreground-background contrastive learning for fine-grained fashion retrieval. In: Proceedings of the 46th International ACM SIGIR Conference on Research and Development in Information Retrieval, pp 1273\u20131282","DOI":"10.1145\/3539618.3591690"},{"issue":"4","key":"6173_CR19","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3624733","volume":"56","author":"Y Deldjoo","year":"2023","unstructured":"Deldjoo Y, Nazary F, Ramisa A, Mcauley J, Pellegrini G, Bellogin A, Noia TD (2023) A review of modern fashion recommender systems. ACM Comput Surv 56(4):1\u201337","journal-title":"ACM Comput Surv"},{"key":"6173_CR20","doi-asserted-by":"crossref","unstructured":"Tan F, Yuan J, Ordonez V (2021) Instance-level image retrieval using reranking transformers. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp 12105\u201312115","DOI":"10.1109\/ICCV48922.2021.01189"},{"key":"6173_CR21","unstructured":"Krizhevsky A, Sutskever I, Hinton GE (2012) Imagenet classification with deep convolutional neural networks. In: Proceedings of the Advances in Neural Information Processing Systems, pp 1097\u20131105"},{"key":"6173_CR22","unstructured":"Dosovitskiy A, Beyer L, Kolesnikov A, Weissenborn D, Zhai X, Unterthiner T, Dehghani M, Minderer M, Heigold G, Gelly S et al (2020) An image is worth 16x16 words: Transformers for image recognition at scale. arXiv preprint arXiv:2010.11929"},{"key":"6173_CR23","doi-asserted-by":"publisher","first-page":"2309","DOI":"10.1109\/TIP.2023.3266166","volume":"32","author":"J Yin","year":"2023","unstructured":"Yin J, Zhang X, Ma Z, Guo J, Liu Y (2023) A real-time memory updating strategy for unsupervised person re-identification. IEEE Trans Image Process 32:2309\u20132321","journal-title":"IEEE Trans Image Process"},{"key":"6173_CR24","doi-asserted-by":"crossref","unstructured":"Dai Z, Wang G, Yuan W, Zhu S, Tan P (2022) Cluster contrast for unsupervised person re-identification. In: Proceedings of the Asian Conference on Computer Vision, pp 1142\u20131160","DOI":"10.1007\/978-3-031-26351-4_20"},{"key":"6173_CR25","doi-asserted-by":"crossref","unstructured":"He K, Fan H, Wu Y, Xie S, Girshick R (2020) Momentum contrast for unsupervised visual representation learning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 9729\u20139738","DOI":"10.1109\/CVPR42600.2020.00975"},{"key":"6173_CR26","unstructured":"Shen X, Xiao Y, Hu SX, Sbai O, Aubry M (2021) Re-ranking for image retrieval and transductive few-shot classification. In: Proceedings of the Advances in Neural Information Processing Systems, pp 25932\u201325943"},{"key":"6173_CR27","doi-asserted-by":"crossref","unstructured":"Zou X, Kong X, Wong W, Wang C, Liu Y, Cao Y (2019) Fashionai: A hierarchical dataset for fashion understanding. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops, pp 296\u2013304","DOI":"10.1109\/CVPRW.2019.00039"},{"key":"6173_CR28","doi-asserted-by":"crossref","unstructured":"Huang J, Feris RS, Chen Q, Yan S (2015) Cross-domain image retrieval with a dual attribute-aware ranking network. In: Proceedings of the IEEE International Conference on Computer Vision, pp 1062\u20131070","DOI":"10.1109\/ICCV.2015.127"},{"key":"6173_CR29","doi-asserted-by":"crossref","unstructured":"Liu Z, Luo P, Qiu S, Wang X, Tang X (2016) Deepfashion: Powering robust clothes recognition and retrieval with rich annotations. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 1096\u20131104","DOI":"10.1109\/CVPR.2016.124"},{"key":"6173_CR30","doi-asserted-by":"crossref","unstructured":"Kang W-C, Kim E, Leskovec J, Rosenberg C, McAuley J (2019) Complete the look: Scene-based complementary product recommendation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 10532\u201310541","DOI":"10.1109\/CVPR.2019.01078"},{"key":"6173_CR31","doi-asserted-by":"crossref","unstructured":"Ji X, Wang W, Zhang M, Yang Y (2017) Cross-domain image retrieval with attention modeling. In: Proceedings of the 25th ACM International Conference on Multimedia, pp 1654\u20131662","DOI":"10.1145\/3123266.3123429"},{"key":"6173_CR32","doi-asserted-by":"crossref","unstructured":"Han X, Wu Z, Jiang Y-G, Davis LS (2017) Learning fashion compatibility with bidirectional lstms. In: Proceedings of the 25th ACM International Conference on Multimedia, pp 1078\u20131086","DOI":"10.1145\/3123266.3123394"},{"key":"6173_CR33","doi-asserted-by":"crossref","unstructured":"Li Y, Hu P, Liu Z, Peng D, Zhou JT, Peng X (2021) Contrastive clustering. In: Proceedings of the AAAI Conference on Artificial Intelligence, pp 8547\u20138555","DOI":"10.1609\/aaai.v35i10.17037"},{"key":"6173_CR34","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"6173_CR35","doi-asserted-by":"crossref","unstructured":"Hu J, Shen L, Sun G (2018) Squeeze-and-excitation networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 7132\u20137141","DOI":"10.1109\/CVPR.2018.00745"},{"key":"6173_CR36","unstructured":"Ba JL, Kiros JR, Hinton GE (2016) Layer normalization. arXiv preprint arXiv:1607.06450"},{"key":"6173_CR37","doi-asserted-by":"crossref","unstructured":"Zhan X, Xie J, Liu Z, Ong Y-S, Loy CC (2020) Online deep clustering for unsupervised representation learning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 6688\u20136697","DOI":"10.1109\/CVPR42600.2020.00672"},{"key":"6173_CR38","first-page":"1","volume":"60","author":"Z Yuan","year":"2022","unstructured":"Yuan Z, Zhang W, Tian C, Rong X, Zhang Z, Wang H, Fu K, Sun X (2022) Remote sensing cross-modal text-image retrieval based on global and local information. IEEE Trans Geosci Remote Sens 60:1\u201316","journal-title":"IEEE Trans Geosci Remote Sens"},{"issue":"12","key":"6173_CR39","doi-asserted-by":"publisher","first-page":"5468","DOI":"10.1109\/TNNLS.2020.2968289","volume":"31","author":"D Gong","year":"2020","unstructured":"Gong D, Zhang Z, Shi Q, Hengel A, Shen C, Zhang Y (2020) Learning deep gradient descent optimization for image deconvolution. IEEE Trans Neural Netw Learn Syst 31(12):5468\u20135482","journal-title":"IEEE Trans Neural Netw Learn Syst"},{"key":"6173_CR40","unstructured":"Huang Z, Wang Y, Li C, He H (2022) Going deeper into permutation-sensitive graph neural networks. In: Proceedings of the International Conference on Machine Learning, pp 9377\u20139409"},{"issue":"1","key":"6173_CR41","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1007\/s10107-010-0402-6","volume":"129","author":"S Kim","year":"2011","unstructured":"Kim S, Kojima M, Mevissen M, Yamashita M (2011) Exploiting sparsity in linear and nonlinear matrix inequalities via positive semidefinite matrix completion. Math Program 129(1):33\u201368","journal-title":"Math Program"},{"key":"6173_CR42","unstructured":"Pavllo D, Grangier D, Auli M (2018) Quaternet: A quaternion-based recurrent model for human motion. arXiv preprint arXiv:1805.06485"},{"key":"6173_CR43","doi-asserted-by":"crossref","unstructured":"Dong X, Shen J (2018) Triplet loss in siamese network for object tracking. In: Proceedings of the European Conference on Computer Vision, pp 459\u2013474","DOI":"10.1007\/978-3-030-01261-8_28"},{"key":"6173_CR44","unstructured":"Oord Avd, Li Y, Vinyals O (2018) Representation learning with contrastive predictive coding. arXiv preprint arXiv:1807.03748"},{"key":"6173_CR45","doi-asserted-by":"crossref","unstructured":"Xiao L, Zhang X, Yamasaki T (2023) Toward a more robust fine-grained fashion retrieval. In: Proceedings of the 6th International Conference on Multimedia Information Processing and Retrieval, pp 1\u20134","DOI":"10.1109\/MIPR59079.2023.00031"},{"key":"6173_CR46","doi-asserted-by":"crossref","unstructured":"Deng J, Dong W, Socher R, Li L-J, Li K, Fei-Fei L (2009) Imagenet: A large-scale hierarchical image database. In: Proceedings of the 2009 IEEE Conference on Computer Vision and Pattern Recognition, pp 248\u2013255","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"6173_CR47","doi-asserted-by":"crossref","unstructured":"Schroff F, Kalenichenko D, Philbin J (2015) Facenet: A unified embedding for face recognition and clustering. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp 815\u2013823","DOI":"10.1109\/CVPR.2015.7298682"},{"key":"6173_CR48","doi-asserted-by":"crossref","unstructured":"Jalwana MA, Akhtar N, Bennamoun M, Mian A (2021) Cameras: Enhanced resolution and sanity preserving class activation mapping for image saliency. In: Proceedings of the\u00a0IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp 16327\u201316336","DOI":"10.1109\/CVPR46437.2021.01606"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-024-06173-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10489-024-06173-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-024-06173-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,22]],"date-time":"2025-02-22T17:21:01Z","timestamp":1740244861000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10489-024-06173-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,1,13]]},"references-count":48,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2025,4]]}},"alternative-id":["6173"],"URL":"https:\/\/doi.org\/10.1007\/s10489-024-06173-8","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"value":"0924-669X","type":"print"},{"value":"1573-7497","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,1,13]]},"assertion":[{"value":"8 December 2024","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"13 January 2025","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they comply with ethical and informed consent for data used.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical and informed consent for data used"}},{"value":"The authors declare that they have no known competing financial interests or personal relationships that could have appeared to influence the work reported in this paper.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"302"}}