{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,26]],"date-time":"2026-03-26T16:43:32Z","timestamp":1774543412381,"version":"3.50.1"},"reference-count":107,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62176139"],"award-info":[{"award-number":["62176139"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62106128"],"award-info":[{"award-number":["62106128"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62176141"],"award-info":[{"award-number":["62176141"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100007129","name":"Natural Science Foundation of Shandong Province","doi-asserted-by":"publisher","award":["ZR2021ZD15"],"award-info":[{"award-number":["ZR2021ZD15"]}],"id":[{"id":"10.13039\/501100007129","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100007129","name":"Natural Science Foundation of Shandong Province","doi-asserted-by":"publisher","award":["ZR2021QF001"],"award-info":[{"award-number":["ZR2021QF001"]}],"id":[{"id":"10.13039\/501100007129","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Young Elite Scientists Sponsorship Program","award":["2021QNRC001"],"award-info":[{"award-number":["2021QNRC001"]}]},{"name":"Open Project of Key Laboratory of Artificial Intelligence, Ministry of Education"},{"name":"Shandong Provincial Natural Science Foundation for Distinguished Young Scholars","award":["ZR2021JQ26"],"award-info":[{"award-number":["ZR2021JQ26"]}]},{"DOI":"10.13039\/501100010040","name":"Taishan Scholar Project of Shandong Province","doi-asserted-by":"publisher","award":["tsqn202103088"],"award-info":[{"award-number":["tsqn202103088"]}],"id":[{"id":"10.13039\/501100010040","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004733","name":"Universidade de Macau","doi-asserted-by":"publisher","award":["SKL-IoTSC(UM)-2021-2023\/ORP\/GA05\/2022"],"award-info":[{"award-number":["SKL-IoTSC(UM)-2021-2023\/ORP\/GA05\/2022"]}],"id":[{"id":"10.13039\/501100004733","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100006469","name":"Fundo para o Desenvolvimento das Ci\u00eancias e da Tecnologia","doi-asserted-by":"publisher","award":["0154\/2022\/A3"],"award-info":[{"award-number":["0154\/2022\/A3"]}],"id":[{"id":"10.13039\/501100006469","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100006469","name":"Fundo para o Desenvolvimento das Ci\u00eancias e da Tecnologia","doi-asserted-by":"publisher","award":["SKL-IOTSC(UM)-2021-2023"],"award-info":[{"award-number":["SKL-IOTSC(UM)-2021-2023"]}],"id":[{"id":"10.13039\/501100006469","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100006469","name":"Fundo para o Desenvolvimento das Ci\u00eancias e da Tecnologia","doi-asserted-by":"publisher","award":["MYRG-CRG2022-00013-IOTSC-ICI"],"award-info":[{"award-number":["MYRG-CRG2022-00013-IOTSC-ICI"]}],"id":[{"id":"10.13039\/501100006469","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Multimedia"],"published-print":{"date-parts":[[2024]]},"DOI":"10.1109\/tmm.2023.3303712","type":"journal-article","created":{"date-parts":[[2023,8,11]],"date-time":"2023-08-11T17:27:26Z","timestamp":1691774846000},"page":"8297-8311","source":"Crossref","is-referenced-by-count":9,"title":["Relational Network via Cascade CRF for Video Language Grounding"],"prefix":"10.1109","volume":"26","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8163-3050","authenticated-orcid":false,"given":"Tong","family":"Zhang","sequence":"first","affiliation":[{"name":"School of Software, Shandong University, Jinan, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9543-6960","authenticated-orcid":false,"given":"Xiankai","family":"Lu","sequence":"additional","affiliation":[{"name":"School of Software, Shandong University, Jinan, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2725-6458","authenticated-orcid":false,"given":"Hao","family":"Zhang","sequence":"additional","affiliation":[{"name":"School of Computer Science and Engineering, Nanyang Technological University, Singapore"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9644-9723","authenticated-orcid":false,"given":"Xiushan","family":"Nie","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Shandong Jianzhu University, Jinan, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8465-1294","authenticated-orcid":false,"given":"Yilong","family":"Yin","sequence":"additional","affiliation":[{"name":"School of Software, Shandong University, Jinan, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2656-3082","authenticated-orcid":false,"given":"Jianbing","family":"Shen","sequence":"additional","affiliation":[{"name":"SKL-IOTSC, University of Macau, Macau, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2021.3092579"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2018.2875363"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2943204"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2018.2866370"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3181116"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3127346"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3183586"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2021.3075242"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2023.3258628"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1007\/s13735-022-00264-3"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2022.3218656"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2022.3204623"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3474085.3475598"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/3477180"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.563"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.618"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00279"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00418"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.585"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2021.3120545"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01186"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D18-1015"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6897"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33019062"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2020.3038993"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00134"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6984"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00225"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00155"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6627"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/WACV45572.2020.9093328"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01082"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33019159"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01030"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2018\/143"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00695"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3414026"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i2.20059"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.324"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.327"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01108"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6984"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2021.3052086"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i4.16406"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1145\/3543857"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2021.3090521"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1145\/3240508.3240549"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33018199"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/WACV.2019.00032"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1145\/3343031.3350879"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01017"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00042"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33018393"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2021.3086591"},{"key":"ref55","first-page":"1984","article-title":"ExCL: Extractive clip localization using natural language descriptions","volume-title":"Proc. Conf. Empir. Methods Natural Lang. Process.","author":"Ghosh","year":"2019"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3060449"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW54120.2021.00361"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.findings-acl.69"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1336"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.577"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413967"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/tmm.2022.3228167"},{"key":"ref63","first-page":"1481","article-title":"WSLLN: Weakly supervised natural language localization networks","volume-title":"Proc. Conf. Empir. Methods Natural Lang. Process.","author":"Gao","year":"2019"},{"key":"ref64","article-title":"Look closer to ground better: Weakly-supervised temporal grounding of sentence in video","author":"Chen","year":"2020"},{"key":"ref65","first-page":"18123","article-title":"Counterfactual contrastive learning for weakly-supervised vision-language grounding","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Zhang","year":"2020"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1145\/3474085.3475278"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2021.3058614"},{"key":"ref68","first-page":"3063","article-title":"Weakly supervised dense event captioning in videos","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Duan","year":"2018"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6820"},{"key":"ref70","article-title":"Weakly-supervised multi-level attentional reconstruction network for grounding textual queries in videos","author":"Song","year":"2020"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2005.1555942"},{"key":"ref72","volume-title":"Probabilistic Graphical Models: Principles and Techniques","author":"Koller","year":"2009"},{"key":"ref73","article-title":"Graph attention networks","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Velikovi","year":"2017"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.2008.2005605"},{"key":"ref75","first-page":"2014","article-title":"Learning convolutional neural networks for graphs","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Niepert","year":"2016"},{"key":"ref76","article-title":"Semi-supervised classification with graph convolutional networks","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Kipf","year":"2017"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2003.1233908"},{"key":"ref78","first-page":"109","article-title":"Efficient inference in fully connected CRFs with Gaussian edge potentials","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Krhenbhl","year":"2011"},{"key":"ref79","first-page":"169.1","article-title":"Convolutional CRFs for semantic segmentation","volume-title":"Proc. Brit. Mach. Vis. Conf.","author":"Teichmann","year":"2019"},{"key":"ref80","first-page":"7689","article-title":"Joint modeling of visual objects and relations for scene graph generation","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Xu","year":"2021"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00933"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00052"},{"key":"ref83","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00418"},{"key":"ref84","first-page":"282","article-title":"Conditional random fields: Probabilistic models for segmenting and labeling sequence data","volume-title":"Proc. 18th Int. Conf. Mach. Learn.","author":"Lafferty","year":"2001"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.179"},{"key":"ref86","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00024"},{"key":"ref87","doi-asserted-by":"publisher","DOI":"10.1145\/3292500.3330888"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_5"},{"key":"ref89","first-page":"316","article-title":"CRF-CNN: Modeling structured information in human pose estimation","volume-title":"Proc. 30th Int. Conf. Neural Inf. Process. Syst.","author":"Chu","year":"2016"},{"key":"ref90","article-title":"Hadamard product for low-rank bilinear pooling","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Kim","year":"2017"},{"key":"ref91","first-page":"361","article-title":"Deeply learning the messages in message passing inference","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Lin","year":"2015"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2017\/558"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_31"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.502"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.83"},{"key":"ref96","doi-asserted-by":"publisher","DOI":"10.1145\/3331184.3331235"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.510"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00207"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33718-5_11"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.493"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1810.04805"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1162"},{"key":"ref103","article-title":"Empirical evaluation of gated recurrent neural networks on sequence modeling","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Chung","year":"2014"},{"key":"ref104","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00155"},{"key":"ref105","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i3.20163"},{"key":"ref106","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3547782"},{"key":"ref107","doi-asserted-by":"publisher","DOI":"10.1162\/neco.2006.18.7.1527"}],"container-title":["IEEE Transactions on Multimedia"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6046\/10384483\/10214636.pdf?arnumber=10214636","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,2]],"date-time":"2024-08-02T08:08:40Z","timestamp":1722586120000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10214636\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"references-count":107,"URL":"https:\/\/doi.org\/10.1109\/tmm.2023.3303712","relation":{},"ISSN":["1520-9210","1941-0077"],"issn-type":[{"value":"1520-9210","type":"print"},{"value":"1941-0077","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024]]}}}