{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,7]],"date-time":"2026-03-07T18:22:25Z","timestamp":1772907745547,"version":"3.50.1"},"reference-count":67,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"name":"RIE2020 Industry Alignment Fund - Industry Collaboration Projects"},{"name":"Cash and in-kind contribution from the Industry Partner"},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["U1913602"],"award-info":[{"award-number":["U1913602"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001459","name":"Ministry of Education - Singapore","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001459","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Academic Research Fund Tier 2","award":["MOE T2EP20220 0007"],"award-info":[{"award-number":["MOE T2EP20220 0007"]}]},{"name":"Academic Research Fund Tier 2","award":["Tier 1 RG14\/22"],"award-info":[{"award-number":["Tier 1 RG14\/22"]}]},{"name":"Academic Research Fund Tier 2","award":["RG95\/20"],"award-info":[{"award-number":["RG95\/20"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Multimedia"],"published-print":{"date-parts":[[2024]]},"DOI":"10.1109\/tmm.2023.3309559","type":"journal-article","created":{"date-parts":[[2023,8,28]],"date-time":"2023-08-28T17:59:41Z","timestamp":1693245581000},"page":"3302-3316","source":"Crossref","is-referenced-by-count":8,"title":["ViTA: Video Transformer Adaptor for Robust Video Depth Estimation"],"prefix":"10.1109","volume":"26","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-0884-5126","authenticated-orcid":false,"given":"Ke","family":"Xian","sequence":"first","affiliation":[{"name":"S-Lab, Nanyang Technological University (NTU), Singapore"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5740-2682","authenticated-orcid":false,"given":"Juewen","family":"Peng","sequence":"additional","affiliation":[{"name":"Key Laboratory of Image Processing and Intelligent Control, Ministry of Education, School of Artificial Intelligence and Automation, Huazhong University of Science and Technology, Wuhan, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9223-1863","authenticated-orcid":false,"given":"Zhiguo","family":"Cao","sequence":"additional","affiliation":[{"name":"Key Laboratory of Image Processing and Intelligent Control, Ministry of Education, School of Artificial Intelligence and Automation, Huazhong University of Science and Technology, Wuhan, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9954-6294","authenticated-orcid":false,"given":"Jianming","family":"Zhang","sequence":"additional","affiliation":[{"name":"Adobe Research, San Francisco, CA, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0329-7458","authenticated-orcid":false,"given":"Guosheng","family":"Lin","sequence":"additional","affiliation":[{"name":"S-Lab, Nanyang Technological University (NTU), Singapore"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1145\/3386569.3392377"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00166"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/3476576.3476728"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3306346.3323015"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01580"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2013.2283451"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2017.2748458"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.445"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2009.52"},{"key":"ref10","first-page":"41","article-title":"Nonrigid structure from motion in trajectory space","volume-title":"Proc. Adv. Neural Inform. Process. Syst.","author":"Akhter","year":"2008,"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.169"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3019967"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00069"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00465"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00643"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01196"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00040"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00795"},{"key":"ref19","first-page":"2366","article-title":"Depth map prediction from a single image using a multi-scale deep network","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Eigen","year":"2014,"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2017.2740321"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-20870-7_41"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW53098.2021.00278"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2941776"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.699"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.700"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2021.3091308"},{"key":"ref27","first-page":"730","article-title":"Single-image depth perception in the wild","volume-title":"Proc. Adv. Neural Inform. Process. Syst.","author":"Chen","year":"2016"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.179"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58536-5_24"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2019.2929202"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3097396"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2019.00046"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00181"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1145\/3474085.3475564"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICCVW54120.2021.00134"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3547978"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00880"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01778"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-021-01484-6"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2021.3136220"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.596"},{"key":"ref42","first-page":"1","article-title":"Deepv2d: Video to depth with differentiable structure from motion","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Teed","year":"2019"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2912121"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2014.2316835"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00538"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2010.11929"},{"key":"ref47","first-page":"10347","article-title":"Training data-efficient image transformers & distillation through attention","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Touvron","year":"2021"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01596"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00392"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00476"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00320"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01332"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.2102.05095"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01419"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00612"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.207"},{"key":"ref59","first-page":"1","article-title":"IRS: A large synthetic indoor robotics stereo dataset for disparity and surface normal estimation","volume-title":"Proc. Int. Conf. Multimedia Expo","author":"Wang","year":"2021"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/IROS45743.2020.9341801"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/IROS.2012.6385773"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33715-4_54"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/3DV.2017.00012"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33783-3_44"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46484-8_45"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-11015-4_25"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00027"}],"container-title":["IEEE Transactions on Multimedia"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6046\/10384483\/10233038.pdf?arnumber=10233038","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,1]],"date-time":"2024-03-01T22:41:24Z","timestamp":1709332884000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10233038\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"references-count":67,"URL":"https:\/\/doi.org\/10.1109\/tmm.2023.3309559","relation":{},"ISSN":["1520-9210","1941-0077"],"issn-type":[{"value":"1520-9210","type":"print"},{"value":"1941-0077","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024]]}}}