{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,7]],"date-time":"2026-02-07T12:02:44Z","timestamp":1770465764374,"version":"3.49.0"},"reference-count":15,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,8,30]],"date-time":"2023-08-30T00:00:00Z","timestamp":1693353600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,8,30]],"date-time":"2023-08-30T00:00:00Z","timestamp":1693353600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,8,30]]},"DOI":"10.1109\/icac57885.2023.10275301","type":"proceedings-article","created":{"date-parts":[[2023,10,16]],"date-time":"2023-10-16T17:58:56Z","timestamp":1697479136000},"page":"1-6","source":"Crossref","is-referenced-by-count":4,"title":["Att-Sinkhorn: Multimodal Alignment with Sinkhorn-based Deep Attention Architecture"],"prefix":"10.1109","author":[{"given":"Qianxia","family":"Ma","sequence":"first","affiliation":[{"name":"Ant Group,Shanghai,China"}]},{"given":"Ming","family":"Zhang","sequence":"additional","affiliation":[{"name":"Aston University,Birmingham,UK"}]},{"given":"Yan","family":"Tang","sequence":"additional","affiliation":[{"name":"Ant Group,Hangzhou,China"}]},{"given":"Zhen","family":"Huang","sequence":"additional","affiliation":[{"name":"Ant Group,Hangzhou,China"}]}],"member":"263","reference":[{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298935"},{"key":"ref12","article-title":"Explain images with multimodal recurrent neural networks","author":"mao","year":"2014","journal-title":"ArXiv Preprint"},{"key":"ref15","first-page":"2048","article-title":"Show, attend and tell: Neural image caption generation with visual attention","author":"xu","year":"0","journal-title":"International Conference on Machine Learning"},{"key":"ref14","article-title":"Multimodal neural language models","author":"kiros","year":"0","journal-title":"International Conference on International Conference on Machine Learning"},{"key":"ref11","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2014","journal-title":"ArXiv Preprint"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2019-3247"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2798607"},{"key":"ref8","article-title":"Computational Optimal Transport","author":"peyr\u00e9","year":"2017","journal-title":"Center for Research in Economics and Statistics Working Papers"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-19992-4_20"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"355","DOI":"10.1561\/2200000073","article-title":"Computational optimal transport","volume":"11","year":"2019","journal-title":"Foundations and Trends in Machine Learning"},{"key":"ref3","article-title":"Effective approaches to attention-based neural machine translation","author":"luong","year":"2015","journal-title":"Computer Science"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-32248-9_71"},{"key":"ref5","author":"zhang","year":"2020","journal-title":"A review on modern computational optimal transport methods with applications in biomedical research"}],"event":{"name":"2023 28th International Conference on Automation and Computing (ICAC)","location":"Birmingham, United Kingdom","start":{"date-parts":[[2023,8,30]]},"end":{"date-parts":[[2023,9,1]]}},"container-title":["2023 28th International Conference on Automation and Computing (ICAC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10275139\/10275143\/10275301.pdf?arnumber=10275301","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,11,6]],"date-time":"2023-11-06T18:57:57Z","timestamp":1699297077000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10275301\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,8,30]]},"references-count":15,"URL":"https:\/\/doi.org\/10.1109\/icac57885.2023.10275301","relation":{},"subject":[],"published":{"date-parts":[[2023,8,30]]}}}