{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T01:15:52Z","timestamp":1740100552991,"version":"3.37.3"},"reference-count":24,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,2,21]],"date-time":"2022-02-21T00:00:00Z","timestamp":1645401600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,2,21]],"date-time":"2022-02-21T00:00:00Z","timestamp":1645401600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100003696","name":"Electronics and Telecommunications Research Institute","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100003696","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,2,21]]},"DOI":"10.1109\/icaiic54071.2022.9722699","type":"proceedings-article","created":{"date-parts":[[2022,3,1]],"date-time":"2022-03-01T20:41:38Z","timestamp":1646167298000},"page":"087-091","source":"Crossref","is-referenced-by-count":0,"title":["Performance Improvement Method of the Video Visual Relation Detection with Multi-modal Feature Fusion"],"prefix":"10.1109","author":[{"given":"Kwang-Ju","family":"Kim","sequence":"first","affiliation":[{"name":"Electronics and Telecommunications Research Institute,Daegu,Korea,42994"}]},{"given":"Pyong-Kun","family":"Kim","sequence":"additional","affiliation":[{"name":"Electronics and Telecommunications Research Institute,Daegu,Korea,42994"}]},{"given":"Kil-Taek","family":"Lim","sequence":"additional","affiliation":[{"name":"Electronics and Telecommunications Research Institute,Daegu,Korea,42994"}]},{"given":"Jong Taek","family":"Lee","sequence":"additional","affiliation":[{"name":"Electronics and Telecommunications Research Institute,Daegu,Korea,42994"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3323873.3325056"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/3343031.3356076"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.52"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.175"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.316"},{"article-title":"Seq-nms for video object detection","year":"2016","author":"han","key":"ref16"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.330"},{"key":"ref18","first-page":"379","article-title":"R-fcn: Object detection via regionbased fully convolutional networks","author":"dai","year":"2016","journal-title":"Advances in neural information processing systems"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2910529"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00318"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2939201"},{"key":"ref6","article-title":"Context-aware visual policy network for fine-grained image captioning","author":"zha","year":"2019","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2018.09.090"},{"key":"ref8","first-page":"766","article-title":"Video summarization with long short-term memory","author":"zhang","year":"2016","journal-title":"European Conference on Computer Vision"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2019.00048"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2019.11.023"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2020.01.085"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TSMC.2017.2680404"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3123266.3123380"},{"article-title":"Efficient estimation of word representations in vector space","year":"2013","author":"mikolov","key":"ref22"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01067"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICME.2017.8019391"},{"key":"ref23","first-page":"852","article-title":"Visual relationship detection with language priors","author":"lu","year":"2016","journal-title":"European Conference on Computer Vision"}],"event":{"name":"2022 International Conference on Artificial Intelligence in Information and Communication (ICAIIC)","start":{"date-parts":[[2022,2,21]]},"location":"Jeju Island, Korea, Republic of","end":{"date-parts":[[2022,2,24]]}},"container-title":["2022 International Conference on Artificial Intelligence in Information and Communication (ICAIIC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9722611\/9722613\/09722699.pdf?arnumber=9722699","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,20]],"date-time":"2022-06-20T21:21:01Z","timestamp":1655760061000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9722699\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,2,21]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/icaiic54071.2022.9722699","relation":{},"subject":[],"published":{"date-parts":[[2022,2,21]]}}}