{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,23]],"date-time":"2026-02-23T15:55:21Z","timestamp":1771862121124,"version":"3.50.1"},"reference-count":65,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"6","license":[{"start":{"date-parts":[[2024,6,1]],"date-time":"2024-06-01T00:00:00Z","timestamp":1717200000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,6,1]],"date-time":"2024-06-01T00:00:00Z","timestamp":1717200000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,6,1]],"date-time":"2024-06-01T00:00:00Z","timestamp":1717200000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"Key Project of Science and Technology Innovation and Entrepreneurship of TDTEC","award":["2021-TD-ZD002"],"award-info":[{"award-number":["2021-TD-ZD002"]}]},{"name":"Key Project of Science and Technology Innovation and Entrepreneurship of TDTEC","award":["2022-TD-ZD004"],"award-info":[{"award-number":["2022-TD-ZD004"]}]},{"name":"Key Project of Science and Technology Innovation and Entrepreneurship of TDTEC","award":["2022-2-TD-ZD001"],"award-info":[{"award-number":["2022-2-TD-ZD001"]}]},{"name":"Key Technologies R&amp;D Programme of Liaoning Province","award":["2023JH1\/10400082"],"award-info":[{"award-number":["2023JH1\/10400082"]}]},{"name":"Key Technologies R&amp;D Programme of Liaoning Province","award":["2023020456-JH\/104"],"award-info":[{"award-number":["2023020456-JH\/104"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Artif. Intell."],"published-print":{"date-parts":[[2024,6]]},"DOI":"10.1109\/tai.2023.3326416","type":"journal-article","created":{"date-parts":[[2023,10,23]],"date-time":"2023-10-23T14:40:03Z","timestamp":1698072003000},"page":"2828-2839","source":"Crossref","is-referenced-by-count":5,"title":["Text-Image Scene Graph Fusion for Multimodal Named Entity Recognition"],"prefix":"10.1109","volume":"5","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9805-8870","authenticated-orcid":false,"given":"Jian","family":"Cheng","sequence":"first","affiliation":[{"name":"Research Institute of Mine Big Data, Chinese Institute of Coal Science, State Key Laboratory for Intelligent Coal Mining and Strata Control, Beijing, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9460-0052","authenticated-orcid":false,"given":"Kaifang","family":"Long","sequence":"additional","affiliation":[{"name":"College of Software, Northeastern University, Shenyang, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-3958-7213","authenticated-orcid":false,"given":"Shuang","family":"Zhang","sequence":"additional","affiliation":[{"name":"College of Software, Northeastern University, Shenyang, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0538-1071","authenticated-orcid":false,"given":"Tian","family":"Zhang","sequence":"additional","affiliation":[{"name":"College of Software, Northeastern University, Shenyang, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9969-211X","authenticated-orcid":false,"given":"Lianbo","family":"Ma","sequence":"additional","affiliation":[{"name":"College of Software, Northeastern University, Shenyang, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5129-995X","authenticated-orcid":false,"given":"Shi","family":"Cheng","sequence":"additional","affiliation":[{"name":"College of Computer Science, Shaanxi Normal University, Xi&#x0027;an, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4276-5410","authenticated-orcid":false,"given":"Yinan","family":"Guo","sequence":"additional","affiliation":[{"name":"China University of Mining and Technology, Xuzhou, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/P15-1034"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1027"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.764"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.521"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1067"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3331184.3331416"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1470"},{"key":"ref8","doi-asserted-by":"crossref","DOI":"10.1109\/TKDE.2022.3224228","article-title":"Multi-modal knowledge graph construction and application: A survey","author":"Zhu","year":"2022"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.291"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413577"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3548427"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.findings-naacl.121"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.wnut-1.11"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/WACV45572.2020.9093614"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.490"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i05.6363"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CAIA.1991.120841"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1186\/1471-2105-6-S1-S14"},{"issue":"1","key":"ref19","first-page":"65","article-title":"Mencius: A chinese named entity recognizer using the maximum entropy-based hybrid model","volume":"9","author":"Tsai","year":"2004","journal-title":"Int. J. Comput. Linguistics Chin. Lang. Process."},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLC.2006.258946"},{"key":"ref21","article-title":"Bidirectional LSTM-CRF models for sequence tagging","author":"Huang","year":"2015"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1283"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.611"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.findings-acl.161"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-1078"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11962"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2019.00061"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1185"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.306"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413650"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i15.17633"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i16.17687"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3548228"},{"key":"ref34","article-title":"A novel framework for multimodal named entity recognition with multi-level alignments","author":"Liu","year":"2023"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.findings-emnlp.473"},{"key":"ref36","first-page":"2055","article-title":"Flat multi-modal interaction transformer for named entity recognition","volume-title":"Proc. 29th Int. Conf. Comput. Linguistics","author":"Lu","year":"2022"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3488560.3498475"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICME52920.2022.9859972"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1016\/j.ipm.2023.103546"},{"key":"ref40","article-title":"Integrating large pre-trained models into multimodal named entity recognition with evidential fusion","author":"Liu","year":"2023"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1145\/3539597.3570485"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298990"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.142"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.330"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00611"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-1037"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.344"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00644"},{"key":"ref49","first-page":"5678","article-title":"Dual capsule attention mask network with mutual learning for visual question answering","volume-title":"Proc. 29th Int. Conf. Comput. Linguistics","author":"Tian","year":"2022"},{"key":"ref50","first-page":"5721","article-title":"Overcoming language priors in visual question answering via distinguishing superficially similar instances","volume-title":"Proc. 29th Int. Conf. Comput. Linguistics","author":"Wu","year":"2022"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01264-9_42"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01094"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00850"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W15-2812"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46454-1_24"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.3115\/1075096.1075150"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00377"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00636"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N16-1030"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1810.04805"},{"key":"ref61","article-title":"Decoupled weight decay regularization","volume-title":"Proc. 7th Int. Conf. Learn. Representations","author":"Loshchilov","year":"2019"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/p16-1101"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.coling-main.168"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.naacl-main.232"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i7.25971"}],"container-title":["IEEE Transactions on Artificial Intelligence"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9078688\/10571778\/10292546.pdf?arnumber=10292546","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T01:09:09Z","timestamp":1755911349000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10292546\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6]]},"references-count":65,"journal-issue":{"issue":"6"},"URL":"https:\/\/doi.org\/10.1109\/tai.2023.3326416","relation":{},"ISSN":["2691-4581"],"issn-type":[{"value":"2691-4581","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,6]]}}}