{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,12]],"date-time":"2026-04-12T06:46:27Z","timestamp":1775976387294,"version":"3.50.1"},"reference-count":101,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62125102"],"award-info":[{"award-number":["62125102"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Geosci. Remote Sensing"],"published-print":{"date-parts":[[2022]]},"DOI":"10.1109\/tgrs.2022.3218921","type":"journal-article","created":{"date-parts":[[2022,11,4]],"date-time":"2022-11-04T01:33:42Z","timestamp":1667525622000},"page":"1-20","source":"Crossref","is-referenced-by-count":134,"title":["Remote Sensing Image Change Captioning With Dual-Branch Transformers: A New Method and a Large Scale Dataset"],"prefix":"10.1109","volume":"60","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3034-6646","authenticated-orcid":false,"given":"Chenyang","family":"Liu","sequence":"first","affiliation":[{"name":"Image Processing Center, School of Astronautics, Beihang University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4271-0206","authenticated-orcid":false,"given":"Rui","family":"Zhao","sequence":"additional","affiliation":[{"name":"Fuxi AI Laboratory, NetEase, Hangzhou, Zhejiang, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6418-3761","authenticated-orcid":false,"given":"Hao","family":"Chen","sequence":"additional","affiliation":[{"name":"Image Processing Center, School of Astronautics, Beihang University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1774-552X","authenticated-orcid":false,"given":"Zhengxia","family":"Zou","sequence":"additional","affiliation":[{"name":"Department of Guidance, Navigation and Control, School of Astronautics, Beihang University, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4772-3172","authenticated-orcid":false,"given":"Zhenwei","family":"Shi","sequence":"additional","affiliation":[{"name":"Image Processing Center, School of Astronautics, Beihang University, Beijing, China"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1016\/j.rse.2015.01.006"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1080\/01431161.2012.700424"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1016\/0034-4257(95)00233-2"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2006.888195"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1016\/S0034-4257(97)00162-4"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2009.2025059"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1080\/014311698215612"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2004.06.002"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1080\/01431160500057889"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1016\/j.apgeog.2010.10.012"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.3390\/rs3112473"},{"key":"ref27","first-page":"385","article-title":"Change vector analysis: An approach for detecting forest changes with Landsat","author":"malila","year":"1980","journal-title":"Proc LARS Symposia"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1080\/01431160801950162"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.215"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2022.3195692"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/IGARSS47720.2021.9554419"},{"key":"ref24","first-page":"1","article-title":"ViLBERT: Pretraining task-agnostic visiolinguistic representations for vision-and-language tasks","volume":"32","author":"lu","year":"2019","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/72.788640"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1154"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2016.2606119"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1613\/jair.1.12007"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CIIS.2017.54"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.3390\/rs12030484"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2020.2988032"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2012.162"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-34500-5_24"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2017.2677464"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.3008036"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.3390\/rs12101688"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref53","first-page":"234","article-title":"U-Net: Convolutional networks for biomedical image segmentation","author":"ronneberger","year":"2015","journal-title":"Proc Int Conf Med Image Comput Comput -Assist Intervent"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2021.3127580"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2017.2738149"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2017.2707528"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.3390\/rs12060901"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1080\/01431160110104728"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.3390\/rs12101662"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2931223"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/JSTARS.2020.3037893"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D18-1436"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2957513"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2022.3160007"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2021.3095166"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2020.3035780"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2021.3066802"},{"key":"ref42","first-page":"4063","article-title":"Fully convolutional Siamese networks for change detection","author":"caye daudt","year":"2018","journal-title":"Proc 25th IEEE Int Conf Image Process (ICIP)"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.3390\/rs11111382"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2019.2956756"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2020.3041530"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2022.3150957"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN48605.2020.9207381"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.3390\/rs12060939"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2020.3009243"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/JSTARS.2022.3153636"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2019.2951636"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2021.3135711"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2021.3102590"},{"key":"ref78","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR48806.2021.9412486"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2021.3105004"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-15561-1_2"},{"key":"ref62","first-page":"1","article-title":"DeViSE: A deep visual-semantic embedding model","volume":"26","author":"frome","year":"2013","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref61","first-page":"1","article-title":"Im2Text: Describing images using 1 million captioned photographs","volume":"24","author":"ordonez","year":"2011","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref63","first-page":"1","article-title":"Deep fragment embeddings for bidirectional image sentence mapping","volume":"27","author":"karpathy","year":"2014","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1109\/JSTARS.2019.2959208"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2019.2893772"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/CITS.2016.7546397"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2017.2776321"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2020.3044054"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.5244\/C.29.61"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2021.3070383"},{"key":"ref1","article-title":"Building damage detection in satellite imagery using convolutional neural networks","author":"xu","year":"2019","journal-title":"arXiv 1910 06444"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7299087"},{"key":"ref94","article-title":"Adam: A method for stochastic optimization","author":"kingma","year":"2014","journal-title":"arXiv 1412 6980"},{"key":"ref93","article-title":"An image is worth 16&#x00D7;16 words: Transformers for image recognition at scale","author":"dosovitskiy","year":"2020","journal-title":"arXiv 2010 11929"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref90","article-title":"Layer normalization","author":"lei ba","year":"2016","journal-title":"arXiv 1607 06450"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W17-3207"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-2021"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58568-6_34"},{"key":"ref97","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2014","journal-title":"arXiv 1409 1556"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/LRA.2020.3003290"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/3474085.3475712"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00472"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.findings-acl.6"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00275"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2022.3154154"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00210"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2021.3132095"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00198"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2022.3198234"},{"key":"ref18","first-page":"2048","article-title":"Show, attend and tell: Neural image caption generation with visual attention","author":"xu","year":"2015","journal-title":"Proc 32nd Int Conf Mach Learn"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3128140"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref83","first-page":"1","article-title":"Attention is all you need","volume":"30","author":"vaswani","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1109\/LGRS.2022.3192062"},{"key":"ref89","doi-asserted-by":"publisher","DOI":"10.3115\/1626355.1626389"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3148210"},{"key":"ref86","article-title":"Microsoft COCO captions: Data collection and evaluation server","author":"chen","year":"2015","journal-title":"arXiv 1504 00325"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.3115\/1073083.1073135"},{"key":"ref88","article-title":"ROUGE: A package for automatic evaluation of summaries","author":"yew","year":"2004","journal-title":"Proc Workshop Text Summarization Branches Out (WAS)"}],"container-title":["IEEE Transactions on Geoscience and Remote Sensing"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/36\/9633014\/09934924.pdf?arnumber=9934924","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,12]],"date-time":"2022-12-12T19:32:19Z","timestamp":1670873539000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9934924\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"references-count":101,"URL":"https:\/\/doi.org\/10.1109\/tgrs.2022.3218921","relation":{},"ISSN":["0196-2892","1558-0644"],"issn-type":[{"value":"0196-2892","type":"print"},{"value":"1558-0644","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022]]}}}