{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,27]],"date-time":"2026-02-27T02:39:23Z","timestamp":1772159963812,"version":"3.50.1"},"reference-count":32,"publisher":"Springer Science and Business Media LLC","issue":"17","license":[{"start":{"date-parts":[[2021,4,24]],"date-time":"2021-04-24T00:00:00Z","timestamp":1619222400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,4,24]],"date-time":"2021-04-24T00:00:00Z","timestamp":1619222400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100003401","name":"Funda\u00e7\u00e3o&nbsp;de&nbsp;Amparo&nbsp;\u00e0&nbsp;Pesquisa&nbsp;do&nbsp;Estado&nbsp;de&nbsp;Alagoas","doi-asserted-by":"publisher","award":["60030001626\/2018"],"award-info":[{"award-number":["60030001626\/2018"]}],"id":[{"id":"10.13039\/501100003401","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"published-print":{"date-parts":[[2021,7]]},"DOI":"10.1007\/s11042-021-10885-1","type":"journal-article","created":{"date-parts":[[2021,4,25]],"date-time":"2021-04-25T05:01:17Z","timestamp":1619326877000},"page":"25851-25873","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":11,"title":["Multimodal deep neural networks for attribute prediction and applications to e-commerce catalogs enhancement"],"prefix":"10.1007","volume":"80","author":[{"given":"Luiz Felipe","family":"Sales","sequence":"first","affiliation":[]},{"given":"Artur","family":"Pereira","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7775-5258","authenticated-orcid":false,"given":"Thales","family":"Vieira","sequence":"additional","affiliation":[]},{"given":"Evandro","family":"de Barros Costa","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,4,24]]},"reference":[{"issue":"10","key":"10885_CR1","doi-asserted-by":"publisher","first-page":"308","DOI":"10.3390\/info10100308","volume":"10","author":"HS Arslan","year":"2019","unstructured":"Arslan HS, Sirts K, Fishel M, Anbarjafari G (2019) Multimodal sequential fashion attribute prediction. Information 10(10):308","journal-title":"Information"},{"key":"10885_CR2","unstructured":"Bracher C, Heinz S, Vollgraf R (2016) Fashion DNA: merging content and sales data for recommendation and article mapping. CoRR arXiv:1609.02489"},{"key":"10885_CR3","doi-asserted-by":"publisher","unstructured":"Cardoso \u00c2, Daolio F, Vargas S (2018) Product characterisation towards personalisation: learning attributes from unstructured data to recommend fashion products. In: Proceedings of the 24th ACM SIGKDD international conference on knowledge discovery & data mining, KDD 2018, London, UK, August 19-23, 2018. https:\/\/doi.org\/10.1145\/3219819.3219888, pp 80\u201389","DOI":"10.1145\/3219819.3219888"},{"key":"10885_CR4","doi-asserted-by":"crossref","unstructured":"Chen MX, Firat O, Bapna A, Johnson M, Macherey W, Foster G, Jones L, Parmar N, Schuster M, Chen Z et al (2018) The best of both worlds: combining recent advances in neural machine translation. arXiv:1804.09849","DOI":"10.18653\/v1\/P18-1008"},{"key":"10885_CR5","unstructured":"Chollet F et al (2015) Keras. https:\/\/github.com\/fchollet\/keras"},{"key":"10885_CR6","unstructured":"Dai AM, Olah C, Le QV (2015) Document embedding with paragraph vectors"},{"key":"10885_CR7","doi-asserted-by":"crossref","unstructured":"Dasgupta R, Tom F, Kumar S, Das Gupta M, Kumar Y, Patro BN, Namboodiri VP (2020) Visually precise query. In: Proceedings of the 28th ACM international conference on multimedia. ACM, pp 3550\u20133558","DOI":"10.1145\/3394171.3413558"},{"key":"10885_CR8","doi-asserted-by":"crossref","unstructured":"Deng J, Dong W, Socher R, Li LJ, Li K, Fei-Fei L (2009) Imagenet: a large-scale hierarchical image database. In: 2009 IEEE Conference on computer vision and pattern recognition. IEEE, pp 248\u2013255","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"10885_CR9","unstructured":"Devlin J, Chang MW, Lee K, Toutanova K (2018) Bert: Pre-training of deep bidirectional transformers for language understanding. arXiv:1810.04805"},{"key":"10885_CR10","doi-asserted-by":"crossref","unstructured":"Fensel D (2001) Challenges in content management for b2b electronic commerce. In: Proceedings second international workshop on user interfaces in data intensive systems. UIDIS 2001. IEEE, pp 2\u20134","DOI":"10.1109\/UIDIS.2001.929920"},{"key":"10885_CR11","unstructured":"Frome A, Corrado GS, Shlens J, Bengio S, Dean J, Ranzato MA, Mikolov T (2013) Devise: a deep visual-semantic embedding model. In: Burges CJC, Bottou L, Welling M, Ghahramani Z, Weinberger KQ (eds) Advances in neural information processing systems. http:\/\/papers.nips.cc\/paper\/5204-devise-a-deep-visual-semantic-embedding-model.pdf, vol 26. Curran Associates, Inc., pp 2121\u20132129"},{"key":"10885_CR12","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2015) Deep residual learning for image recognition. CoRR arXiv:1512.03385","DOI":"10.1109\/CVPR.2016.90"},{"key":"10885_CR13","doi-asserted-by":"crossref","unstructured":"He K, Zhang X, Ren S, Sun J (2016) Deep residual learning for image recognition. In: Proceedings of the IEEE conference on computer vision and pattern recognition, pp 770\u2013778","DOI":"10.1109\/CVPR.2016.90"},{"key":"10885_CR14","doi-asserted-by":"crossref","unstructured":"Inoue N, Simo-Serra E, Yamasaki T, Ishikawa H (2017) Multi-label fashion image classification with minimal human supervision. In: 2017 IEEE international conference on computer vision workshops (ICCVW), pp 2261\u20132267","DOI":"10.1109\/ICCVW.2017.265"},{"key":"10885_CR15","volume-title":"Speech and language processing: an introduction to natural language processing. Computational Linguistics and Speech Recognition","author":"D Jurasky","year":"2000","unstructured":"Jurasky D, Martin JH (2000) Speech and language processing: an introduction to natural language processing. Computational Linguistics and Speech Recognition. Prentice Hall, New Jersey"},{"key":"10885_CR16","doi-asserted-by":"publisher","unstructured":"Katarya R, Arora Y (2020) Capsmf: a novel product recommender system using deep learning based text analysis model. Multimedia Tools and Applications. https:\/\/doi.org\/10.1007\/s11042-020-09199-5","DOI":"10.1007\/s11042-020-09199-5"},{"key":"10885_CR17","doi-asserted-by":"publisher","unstructured":"Kim Y (2014) Convolutional neural networks for sentence classification. In: Proceedings of the 2014 conference on empirical methods in natural language processing (EMNLP). https:\/\/doi.org\/10.3115\/v1\/D14-1181. https:\/\/www.aclweb.org\/anthology\/D14-1181. Association for Computational Linguistics, Doha, pp 1746\u20131751","DOI":"10.3115\/v1\/D14-1181"},{"key":"10885_CR18","unstructured":"Kingma DP, Ba J (2014) Adam: a method for stochastic optimization. arXiv:1412.6980"},{"key":"10885_CR19","unstructured":"Laenen K, Zoghbi S, Moens MF (2017) Cross-modal search for fashion attributes. In: Proceedings of the KDD 2017 workshop on machine learning meets fashion. ACM"},{"key":"10885_CR20","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1016\/j.neucom.2016.12.038","volume":"234","author":"W Liu","year":"2017","unstructured":"Liu W, Wang Z, Liu X, Zeng N, Liu Y, Alsaadi FE (2017) A survey of deep neural network architectures and their applications. Neurocomputing 234:11\u201326","journal-title":"Neurocomputing"},{"key":"10885_CR21","doi-asserted-by":"crossref","unstructured":"Liu Z, Luo P, Qiu S, Wang X, Tang X (2016) Deepfashion: powering robust clothes recognition and retrieval with rich annotations. In: 2016 IEEE Conference on computer vision and pattern recognition (CVPR), pp 1096\u20131104","DOI":"10.1109\/CVPR.2016.124"},{"key":"10885_CR22","doi-asserted-by":"publisher","first-page":"12","DOI":"10.1016\/j.dss.2015.03.008","volume":"74","author":"J Lu","year":"2015","unstructured":"Lu J, Wu D, Mao M, Wang W, Zhang G (2015) Recommender system application developments: a survey. Decis Support Syst 74:12\u201332","journal-title":"Decis Support Syst"},{"key":"10885_CR23","unstructured":"Ruder S (2016) An overview of gradient descent optimization algorithms. CoRR arXiv:1609.04747"},{"key":"10885_CR24","unstructured":"Schindler A, Lidy T, Karner S, Hecker M (2018) Fashion and apparel classification using convolutional neural networks. CoRR arXiv:1811.04374"},{"key":"10885_CR25","unstructured":"Simonyan K, Zisserman A (2014) Very deep convolutional networks for large-scale image recognition. arXiv:1409.1556"},{"key":"10885_CR26","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s11042-017-5245-1","volume":"77","author":"GL Sun","year":"2017","unstructured":"Sun GL, Cheng ZQ, Wu X, Peng Q (2017) Personalized clothing recommendation combining user social circle and fashion style consistency. Multimedia Tools and Applications 77:1\u201324. https:\/\/doi.org\/10.1007\/s11042-017-5245-1","journal-title":"Multimedia Tools and Applications"},{"key":"10885_CR27","unstructured":"Szegedy C, Ioffe S, Vanhoucke V (2016) Inception-v4, inception-resnet and the impact of residual connections on learning. CoRR arXiv:1602.07261"},{"key":"10885_CR28","doi-asserted-by":"crossref","unstructured":"Szegedy C, Liu W, Jia Y, Sermanet P, Reed SE, Anguelov D, Erhan D, Vanhoucke V, Rabinovich A (2014) Going deeper with convolutions. CoRR arXiv:1409.4842","DOI":"10.1109\/CVPR.2015.7298594"},{"issue":"3","key":"10885_CR29","doi-asserted-by":"publisher","first-page":"55","DOI":"10.1109\/MCI.2018.2840738","volume":"13","author":"T Young","year":"2018","unstructured":"Young T, Hazarika D, Poria S, Cambria E (2018) Recent trends in deep learning based natural language processing [review article]. IEEE Comput Intell Mag 13(3):55\u201375","journal-title":"IEEE Comput Intell Mag"},{"key":"10885_CR30","doi-asserted-by":"crossref","unstructured":"Yu L, Simo-Serra E, Moreno-Noguer F, Rubio A (2017) Multi-modal embedding for main product detection in fashion. In: 2017 IEEE international conference on computer vision workshops (ICCVW), pp 2236\u20132242","DOI":"10.1109\/ICCVW.2017.261"},{"key":"10885_CR31","doi-asserted-by":"crossref","unstructured":"Yu W, Zhang H, He X, Chen X, Xiong L, Qin Z (2018) Aesthetic-based clothing recommendation. In: Proceedings of the 2018 world wide web conference, pp 649\u2013658","DOI":"10.1145\/3178876.3186146"},{"key":"10885_CR32","unstructured":"Zahavy T, Magnani A, Krishnan A, Mannor S (2016) Is a picture worth a thousand words? A deep multi-modal fusion architecture for product classification in e-commerce. CoRR arXiv:1611.09534"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-021-10885-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-021-10885-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-021-10885-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,7,6]],"date-time":"2021-07-06T06:14:05Z","timestamp":1625552045000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-021-10885-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,4,24]]},"references-count":32,"journal-issue":{"issue":"17","published-print":{"date-parts":[[2021,7]]}},"alternative-id":["10885"],"URL":"https:\/\/doi.org\/10.1007\/s11042-021-10885-1","relation":{},"ISSN":["1380-7501","1573-7721"],"issn-type":[{"value":"1380-7501","type":"print"},{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,4,24]]},"assertion":[{"value":"13 August 2020","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 February 2021","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 April 2021","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 April 2021","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"<!--Emphasis Type='Bold' removed-->Conflict of Interests"}}]}}