{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,4,9]],"date-time":"2025-04-09T17:34:54Z","timestamp":1744220094509,"version":"3.28.0"},"reference-count":32,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,9]]},"DOI":"10.1109\/bigmm.2018.8499060","type":"proceedings-article","created":{"date-parts":[[2018,10,23]],"date-time":"2018-10-23T00:35:25Z","timestamp":1540254925000},"page":"1-5","source":"Crossref","is-referenced-by-count":2,"title":["Spatial- Temporal Attention for Image Captioning"],"prefix":"10.1109","author":[{"given":"Junwei","family":"Zhou","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xi","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jizhong","family":"Han","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Songlin","family":"Hu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hongchao","family":"Gao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"doi-asserted-by":"publisher","key":"ref32","DOI":"10.1109\/CVPR.2016.503"},{"doi-asserted-by":"publisher","key":"ref31","DOI":"10.1109\/CVPR.2017.559"},{"doi-asserted-by":"publisher","key":"ref30","DOI":"10.1109\/CVPR.2016.10"},{"doi-asserted-by":"publisher","key":"ref10","DOI":"10.1109\/CVPR.2016.494"},{"doi-asserted-by":"publisher","key":"ref11","DOI":"10.1109\/CVPR.2015.7298932"},{"key":"ref12","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Advances in neural information processing systems"},{"doi-asserted-by":"publisher","key":"ref13","DOI":"10.3115\/1626355.1626389"},{"doi-asserted-by":"publisher","key":"ref14","DOI":"10.1109\/5.726791"},{"key":"ref15","first-page":"4133","article-title":"Image caption with global-local attention","author":"li","year":"2017","journal-title":"AAAI"},{"key":"ref16","article-title":"Rouge: A package for automatic evaluation of summaries","volume":"8","author":"lin","year":"2004","journal-title":"Text Summarization Branches Out Proceedings of the ACL-04 Workshop"},{"year":"2016","author":"lu","journal-title":"Knowing when to look Adaptive attention via a visual sentinel for image captioning","key":"ref17"},{"key":"ref18","first-page":"289","article-title":"Hierarchical question-image co-attention for visual question answering","author":"lu","year":"2016","journal-title":"Advances in neural information processing systems"},{"year":"2014","author":"mao","journal-title":"Deep captioning with multimodal recurrent neural networks (m-rnn)","key":"ref19"},{"key":"ref28","first-page":"2397","article-title":"Dynamic memory networks for visual and textual question answering","author":"xiong","year":"2016","journal-title":"International Conference on Machine Learning"},{"year":"2015","author":"chen","journal-title":"Microsoft COCO captions Data collection and evaluation server","key":"ref4"},{"year":"2016","author":"wu","journal-title":"Encode review and decode Reviewer module for caption generation","key":"ref27"},{"doi-asserted-by":"publisher","key":"ref3","DOI":"10.1109\/ICCV.2017.64"},{"doi-asserted-by":"publisher","key":"ref6","DOI":"10.1109\/CVPR.2015.7298878"},{"key":"ref29","first-page":"2048","article-title":"Show, attend and tell: Neural image caption generation with visual attention","author":"xu","year":"2015","journal-title":"International Conference on Machine Learning"},{"key":"ref5","first-page":"898","article-title":"Contrastive learning for image captioning","author":"dai","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref8","first-page":"15","article-title":"Every picture tells a story: Generating sentences from images","author":"farhadi","year":"2010","journal-title":"European Conference on Computer Vision"},{"doi-asserted-by":"publisher","key":"ref7","DOI":"10.1109\/CVPR.2015.7298754"},{"doi-asserted-by":"publisher","key":"ref2","DOI":"10.1109\/CVPR.2017.667"},{"doi-asserted-by":"publisher","key":"ref9","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref1","article-title":"Deep compositional captioning: Describing novel object categories without paired training data","author":"anne","year":"2016","journal-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition"},{"key":"ref20","first-page":"311","article-title":"Bleu: a method for automatic evaluation of machine translation","author":"papineni","year":"2002","journal-title":"Proceedings of the 40th Annual Meeting on Association for Computational Linguistics  - ACL '02"},{"year":"2014","author":"simonyan","journal-title":"Very Deep Convolutional Networks for Large-scale Image Recognition","key":"ref22"},{"year":"2017","author":"ren","journal-title":"Deep reinforcement learning-based image captioning with embedding reward","key":"ref21"},{"doi-asserted-by":"publisher","key":"ref24","DOI":"10.1109\/CVPR.2015.7299087"},{"doi-asserted-by":"publisher","key":"ref23","DOI":"10.1109\/CVPR.2015.7298594"},{"doi-asserted-by":"publisher","key":"ref26","DOI":"10.1109\/CVPR.2016.29"},{"doi-asserted-by":"publisher","key":"ref25","DOI":"10.1109\/CVPR.2015.7298935"}],"event":{"name":"2018 IEEE Fourth International Conference on Multimedia Big Data (BigMM)","start":{"date-parts":[[2018,9,13]]},"location":"Xi'an","end":{"date-parts":[[2018,9,16]]}},"container-title":["2018 IEEE Fourth International Conference on Multimedia Big Data (BigMM)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8482104\/8499056\/08499060.pdf?arnumber=8499060","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,26]],"date-time":"2022-01-26T21:47:17Z","timestamp":1643233637000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8499060\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,9]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/bigmm.2018.8499060","relation":{},"subject":[],"published":{"date-parts":[[2018,9]]}}}