{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,25]],"date-time":"2026-04-25T14:40:29Z","timestamp":1777128029044,"version":"3.51.4"},"reference-count":76,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62072112"],"award-info":[{"award-number":["62072112"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"National Key R&amp;D Program of China","award":["2020AAA0108301"],"award-info":[{"award-number":["2020AAA0108301"]}]},{"name":"Scientific and Technological Innovation Action Plan of Shanghai Science and Technology Committee","award":["22511101502"],"award-info":[{"award-number":["22511101502"]}]},{"name":"Scientific and Technological Innovation Action Plan of Shanghai Science and Technology Committee","award":["21DZ2203300"],"award-info":[{"award-number":["21DZ2203300"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Multimedia"],"published-print":{"date-parts":[[2023]]},"DOI":"10.1109\/tmm.2022.3225720","type":"journal-article","created":{"date-parts":[[2022,12,1]],"date-time":"2022-12-01T00:21:26Z","timestamp":1669854086000},"page":"7710-7725","source":"Crossref","is-referenced-by-count":7,"title":["Dual Cross-Attention for Video Object Segmentation via Uncertainty Refinement"],"prefix":"10.1109","volume":"25","author":[{"given":"Jiahao","family":"Hong","sequence":"first","affiliation":[{"name":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2358-8543","authenticated-orcid":false,"given":"Wei","family":"Zhang","sequence":"additional","affiliation":[{"name":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"}]},{"given":"Zhiwei","family":"Feng","sequence":"additional","affiliation":[{"name":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3339-8751","authenticated-orcid":false,"given":"Wenqiang","family":"Zhang","sequence":"additional","affiliation":[{"name":"Shanghai Key Laboratory of Intelligent Information Processing, School of Computer Science, Fudan University, Shanghai, China"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.79"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2020.3037461"},{"key":"ref3","article-title":"MOT16: A benchmark for multi-object tracking","author":"Milan","year":"2016"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.565"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.5244\/C.31.116"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-20870-7_35"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00626"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2838670"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01237-3_4"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.238"},{"key":"ref11","first-page":"325","article-title":"MaskRNN: Instance level video object segmentation","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"2017","author":"Hu","year":"2017"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.372"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00971"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58558-7_20"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00542"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58580-8_39"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00770"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00932"},{"key":"ref19","first-page":"3430","article-title":"Video object segmentation with adaptive feature bank and uncertain-region refinement","volume-title":"Proc. 34th Int. Conf. Neural Inf. Process. Syst","author":"Liang","year":"2020"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58607-2_43"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58542-6_38"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00135"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00413"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00134"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00953"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00794"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2918730"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00125"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00680"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.790"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00142"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00940"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58536-5_46"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00743"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2021.3081597"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00890"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00551"},{"key":"ref38","first-page":"11781","article-title":"Rethinking space-time networks with improved memory coverage for efficient video object segmentation","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"34","author":"Cheng","year":"2021"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01656"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01265"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01038"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00823"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3013717"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TCYB.2020.2992433"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.336"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00916"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.480"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01228-1_36"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2018.2890361"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00412"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00488"},{"key":"ref52","first-page":"5998","article-title":"Attention is all you need","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Vaswani","year":"2017"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1285"},{"key":"ref54","first-page":"4171","article-title":"BERT: Pre-training of deep bidirectional transformers for language understanding","volume-title":"Proc. NAACL-HLT","author":"Kenton","year":"2019"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00813"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01009"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00033"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00585"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00930"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00982"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00863"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01234-2_1"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46493-0_38"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58520-4_26"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.85"},{"key":"ref67","article-title":"The 2017 DAVIS challenge on video object segmentation","author":"Pont-Tuset"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2014.2345401"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-009-0275-4"},{"key":"ref71","article-title":"Adam: A method for stochastic optimization","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Kingma","year":"2015"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00661"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00408"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01228-1_36"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00698"},{"key":"ref76","article-title":"BoLTVOS: Box-level tracking for video object segmentation","author":"Voigtlaender","year":"2019"}],"container-title":["IEEE Transactions on Multimedia"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6046\/10016790\/09966825.pdf?arnumber=9966825","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,12,20]],"date-time":"2023-12-20T00:12:12Z","timestamp":1703031132000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9966825\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"references-count":76,"URL":"https:\/\/doi.org\/10.1109\/tmm.2022.3225720","relation":{},"ISSN":["1520-9210","1941-0077"],"issn-type":[{"value":"1520-9210","type":"print"},{"value":"1941-0077","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023]]}}}