{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T10:05:31Z","timestamp":1777889131782,"version":"3.51.4"},"reference-count":49,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,19]]},"DOI":"10.1109\/iccv51701.2025.00508","type":"proceedings-article","created":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T19:45:49Z","timestamp":1777491949000},"page":"5348-5358","source":"Crossref","is-referenced-by-count":0,"title":["DAViD: Data-Efficient and Accurate Vision Models from Synthetic Data DAViD also references Michelangelo's David\u2014an iconic symbol of anatomical precision-and the David vs. Goliath story, reflecting our small yet powerful dataset and models."],"prefix":"10.1109","author":[{"given":"Fatemeh","family":"Saleh","sequence":"first","affiliation":[{"name":"Microsoft,Cambridge,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sadegh","family":"Aliakbarian","sequence":"additional","affiliation":[{"name":"Microsoft,Cambridge,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Charlie","family":"Hewitt","sequence":"additional","affiliation":[{"name":"Microsoft,Cambridge,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lohit","family":"Petikam","sequence":"additional","affiliation":[{"name":"Microsoft,Cambridge,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"family":"Xiao-Xian","sequence":"additional","affiliation":[{"name":"Microsoft,Cambridge,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Antonio","family":"Criminisi","sequence":"additional","affiliation":[{"name":"Microsoft,Cambridge,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Thomas","family":"J","sequence":"additional","affiliation":[{"name":"Microsoft,Cambridge,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tadas","family":"Baltru\u0161aitis","sequence":"additional","affiliation":[{"name":"Microsoft,Cambridge,UK"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00843"},{"key":"ref2","article-title":"Richter, and Vladlen Koltun. Depth pro: Sharp monocular metric depth in less than a second","volume-title":"International Conference on Learning Representations","author":"Bochkovskii"},{"key":"ref3","first-page":"2","article-title":"Find: An unsupervised implicit 3d model of articulated human feet","volume-title":"British Machine Vision Conference (BMVC)","author":"Boyne"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2011.37"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.350"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref7","first-page":"4","article-title":"An image is worth 16\u00d716 words: Transformers for image recognition at scale","volume-title":"International Conference on Learning Representations","author":"Dosovitskiy"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01061"},{"key":"ref9","journal-title":"Renderpeople GmbH. Renderpeople"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01237"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/3687772"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00423"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01256"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58545-7_12"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/WACV48630.2021.00159"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v36i1.19999"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-73235-5_12"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/3474085.3475512"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00865"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1405.0312"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6832"},{"key":"ref22","first-page":"5","author":"Loshchilov","year":"2016","journal-title":"Sgdr: Stochastic gradient descent with warm restarts"},{"key":"ref23","first-page":"5","author":"Loshchilov","year":"2017","journal-title":"Decoupled weight decay regularization"},{"key":"ref24","first-page":"183","article-title":"Rapid acquisition of specular and diffuse normal maps from polarized spherical gradient illumination","volume-title":"Proceedings of the 18th Eurographics Conference on Rendering Techniques","author":"Ma"},{"key":"ref25","article-title":"Codec Avatar Studio: Paired Human Captures for Complete, Driveable, and Generalizable Avatars","author":"Martinez","year":"2024","journal-title":"NeurIPS Track on Datasets and Benchmarks"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TSMC.2014.2331215"},{"key":"ref27","article-title":"DINOv2: Learning robust visual features without supervision","author":"Oquab","year":"2024","journal-title":"Transactions on Machine Learning Research"},{"key":"ref28","first-page":"2","article-title":"AGORA: Avatars in geography optimized for regression analysis. In Proceedings IEEE\/CVF Conf","volume-title":"on Computer Vision and Pattern Recognition (CVPR)","author":"Patel"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01123"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/3681758.3697987"},{"key":"ref31","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"International conference on machine learning","author":"Radford"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3019967"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.3019967"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01196"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2016.01.002"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1016\/j.imavis.2016.01.002"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00016"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00795"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-67558-9_28"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-018-1130-2"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00366"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01294"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00057"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.52202\/079017-0688"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.596"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.01855"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01632"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00569"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/WACV57701.2024.00411"}],"event":{"name":"2025 IEEE\/CVF International Conference on Computer Vision (ICCV)","location":"Honolulu, HI, USA","start":{"date-parts":[[2025,10,19]]},"end":{"date-parts":[[2025,10,25]]}},"container-title":["2025 IEEE\/CVF International Conference on Computer Vision (ICCV)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11443115\/11443287\/11444748.pdf?arnumber=11444748","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T05:07:16Z","timestamp":1777612036000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11444748\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,19]]},"references-count":49,"URL":"https:\/\/doi.org\/10.1109\/iccv51701.2025.00508","relation":{},"subject":[],"published":{"date-parts":[[2025,10,19]]}}}