{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,27]],"date-time":"2026-05-27T14:43:55Z","timestamp":1779893035726,"version":"3.53.1"},"reference-count":55,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"1","license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61671196"],"award-info":[{"award-number":["61671196"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61525206"],"award-info":[{"award-number":["61525206"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61701149"],"award-info":[{"award-number":["61701149"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Shenzhen Fundamental Research fund","award":["JCYJ20180306174120445"],"award-info":[{"award-number":["JCYJ20180306174120445"]}]},{"name":"Shenzhen Fundamental Research fund","award":["JCYJ20160331185006518"],"award-info":[{"award-number":["JCYJ20160331185006518"]}]},{"name":"Zhejiang Province Nature Science Foundation of China","award":["LR17F030006"],"award-info":[{"award-number":["LR17F030006"]}]},{"DOI":"10.13039\/501100012166","name":"National Basic Research Program of 
China","doi-asserted-by":"publisher","award":["2017YFC0820600"],"award-info":[{"award-number":["2017YFC0820600"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012166","name":"National Basic Research Program of China","doi-asserted-by":"publisher","award":["2017YFC0820605"],"award-info":[{"award-number":["2017YFC0820605"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012166","name":"National Basic Research Program of China","doi-asserted-by":"publisher","award":["2017YFC0820604"],"award-info":[{"award-number":["2017YFC0820604"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100009019","name":"Shenzhen University","doi-asserted-by":"publisher","award":["2019041"],"award-info":[{"award-number":["2019041"]}],"id":[{"id":"10.13039\/501100009019","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. 
Multimedia"],"published-print":{"date-parts":[[2020,1]]},"DOI":"10.1109\/tmm.2019.2924576","type":"journal-article","created":{"date-parts":[[2019,6,25]],"date-time":"2019-06-25T16:42:50Z","timestamp":1561480970000},"page":"229-241","source":"Crossref","is-referenced-by-count":314,"title":["STAT: Spatial-Temporal Attention Mechanism for Video Captioning"],"prefix":"10.1109","volume":"22","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-1204-0512","authenticated-orcid":false,"given":"Chenggang","family":"Yan","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9525-9060","authenticated-orcid":false,"given":"Yunbin","family":"Tu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4080-6888","authenticated-orcid":false,"given":"Xingzheng","family":"Wang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3320-2904","authenticated-orcid":false,"given":"Yongbing","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6448-4839","authenticated-orcid":false,"given":"Xinhong","family":"Hao","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1151-1792","authenticated-orcid":false,"given":"Yongdong","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Qionghai","family":"Dai","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.571"},{"key":"ref38","first-page":"190","article-title":"Collecting highly parallel data for paraphrase 
evaluation","author":"chen","year":"0","journal-title":"Proc 49th Ann Meeting of the Assoc for Computational Linguistics Human Language Technologies - Volume 1"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-05710-7_4"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2018.2846664"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/3123266.3123354"},{"key":"ref30","article-title":"Video captioning with recurrent networks based on frame-and video-level features and visual content classification","author":"shetty","year":"2015"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.508"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.497"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.503"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298935"},{"key":"ref28","first-page":"77","article-title":"Show, attend and tell: Neural image caption generation with visual 
attention","volume":"14","author":"xu","year":"2015","journal-title":"ICML"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0158664"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.662"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2011.2177646"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2017.2729019"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/N15-1173"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2017.2749977"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2018.2855422"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2017.2749977"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2017.2749965"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0162939"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/LSP.2014.2310494"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1162"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1145\/2964284.2984062"},{"key":"ref55","article-title":"ADADELTA: An adaptive learning rate 
method","author":"zeiler","year":"2012"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1145\/2964284.2984064"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1145\/2964284.2984066"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1145\/2964284.2984065"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.117"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.512"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.3115\/1073083.1073135"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.496"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2015.2443556"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2003.811617"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2004.840598"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2008.2004912"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2018.2808685"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2018\/365"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2018\/157"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2010.2089504"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"421","DOI":"10.1109\/TMM.2008.917346","article-title":"A novel framework for semantic annotation and personalized retrieval of sports video","volume":"10","author":"xu","year":"2008","journal-title":"IEEE Trans 
Multimedia"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2018.2814344"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2017.2751140"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2017.2722687"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2015.2482228"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2577031"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.450"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.510"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.223"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7299087"},{"key":"ref41","first-page":"376","article-title":"Meteor universal: Language specific translation evaluation for any target language","author":"lavie","year":"0","journal-title":"Proc Workshop Statist Mach Translation"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"ref43","article-title":"Microsoft coco captions: Data collection and evaluation server","author":"chen","year":"2015"}],"container-title":["IEEE Transactions on 
Multimedia"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6046\/8949825\/08744407.pdf?arnumber=8744407","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,12]],"date-time":"2022-01-12T16:16:00Z","timestamp":1642004160000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8744407\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,1]]},"references-count":55,"journal-issue":{"issue":"1"},"URL":"https:\/\/doi.org\/10.1109\/tmm.2019.2924576","relation":{},"ISSN":["1520-9210","1941-0077"],"issn-type":[{"value":"1520-9210","type":"print"},{"value":"1941-0077","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,1]]}}}