{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T22:27:07Z","timestamp":1777501627148,"version":"3.51.4"},"reference-count":105,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"1","license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100004410","name":"T\u00fcrkiye Bilimsel ve Teknolojik Ara\u015ft\u0131rma Kurumu","doi-asserted-by":"publisher","award":["116E445"],"award-info":[{"award-number":["116E445"]}],"id":[{"id":"10.13039\/501100004410","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Pattern Anal. Mach. Intell."],"published-print":{"date-parts":[[2023,1,1]]},"DOI":"10.1109\/tpami.2022.3143074","type":"journal-article","created":{"date-parts":[[2022,1,13]],"date-time":"2022-01-13T20:36:46Z","timestamp":1642106206000},"page":"1217-1232","source":"Crossref","is-referenced-by-count":50,"title":["Towards Zero-Shot Sign Language Recognition"],"prefix":"10.1109","volume":"45","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2811-3747","authenticated-orcid":false,"given":"Yunus Can","family":"Bilge","sequence":"first","affiliation":[{"name":"Graduate School of Science and Engineering, Hacettepe University, Ankara, Turkey"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0962-7101","authenticated-orcid":false,"given":"Ramazan Gokberk","family":"Cinbis","sequence":"additional","affiliation":[{"name":"Department of Computer Engineering, Middle East Technical University, Ankara, Turkey"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8644-2875","authenticated-orcid":false,"given":"Nazli","family":"Ikizler-Cinbis","sequence":"additional","affiliation":[{"name":"Computer Engineering Department, Hacettepe University, Ankara, Turkey"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref39","first-page":"291","article-title":"Watch, read and lookup: Learning to spot signs from multiple supervisors","author":"momeni","year":"2020","journal-title":"Proc Asian Conf Comput Vis"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58621-8_3"},{"key":"ref33","first-page":"1","article-title":"Large-scale learning of sign language by watching TV (using co-occurrences)","author":"pfister","year":"2013","journal-title":"Proc Brit Mach Vis Conf"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TSMCB.2010.2065802"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206523"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2007.383346"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2911077"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.364"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10599-4_52"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206599"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58621-8_40"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/WACV45572.2020.9093512"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2006.51"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/86.413199"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/11550518_50"},{"key":"ref21","first-page":"165","article-title":"Machine recognition of auslan signs using powergloves: Towards large-lexicon recognition of sign language","author":"kadous","year":"1996","journal-title":"Proc Workshop Integration Gesture Lang Speech"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICSMC.1997.625742"},{"key":"ref23","first-page":"359","article-title":"Sign language recognition using boosted volumetric features","author":"cooper","year":"2007","journal-title":"Proc IAPR Conf Mach Vis Appl"},{"key":"ref101","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01004"},{"key":"ref100","first-page":"433","article-title":"Learning visual attributes","author":"ferrari","year":"2007","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1007\/s001380050080"},{"key":"ref50","first-page":"433","article-title":"Learning visual attributes","author":"ferrari","year":"2008","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref51","first-page":"3464","article-title":"Zero-shot recognition with unreliable attributes","author":"jayaraman","year":"2014","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46493-0_21"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298730"},{"key":"ref57","first-page":"1143","article-title":"Im2text: Describing images using 1 million captioned photographs","author":"ordonez","year":"2011","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2012.162"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10599-4_23"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2013.140"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.111"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2011.6126281"},{"key":"ref40","article-title":"Purdue RVL-SLLL american sign language database. school of electrical and computer engineering technical report","author":"wilbur","year":"2006","journal-title":"Technical Report TR-96&#x2013;1"},{"key":"ref4","author":"valli","year":"2000","journal-title":"Linguistics of American Sign Language An Introduction"},{"key":"ref3","first-page":"1","article-title":"Challenges in development of the american sign language lexicon video dataset (ASLLVD) corpus","author":"neidle","year":"2012","journal-title":"Proc 5th Workshop Representation Process Sign Languages Interact Between Corpus Lexicon Lang Resour Eval Conf"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00812"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1111\/j.1749-818X.2011.00304.x"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2015.09.013"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206772"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.332"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.5244\/C.30.136"},{"key":"ref46","first-page":"1911","article-title":"Extensions of the sign language recognition and translation corpus RWTH-PHOENIX-weather","author":"forster","year":"2014","journal-title":"Proc 9th Int Conf Lang Resour Eval"},{"key":"ref45","first-page":"1627","article-title":"Dynamic affine-invariant shape-appearance handshape features and classification in sign language videos","volume":"14","author":"roussos","year":"2013","journal-title":"J Mach Learn Res"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206594"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11903"},{"key":"ref42","first-page":"1","article-title":"LSA64: An argentinian sign language dataset","author":"ronchetti","year":"2016","journal-title":"Proc Congreso Argentino de Ciencias de la Computaci&#x00F3;n"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/AFGR.2008.4813472"},{"key":"ref44","first-page":"1","article-title":"The devisign large vocabulary of chinese sign language database and baseline evaluations","author":"chai","year":"2014","journal-title":"Tech Rep VIPL-TR-14-SLR-001"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-73279-2_73"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP.2015.7350760"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.521"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995353"},{"key":"ref70","first-page":"4171","article-title":"BERT: Pre-training of deep bidirectional transformers for language understanding","author":"devlin","year":"2019","journal-title":"Proc Conf Assoc Comput Linguistics"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2627563"},{"key":"ref77","first-page":"1","article-title":"Action2vec: A crossmodal embedding approach to action learning","author":"hahn","year":"2018","journal-title":"Proc Brit Mach Vis Conf"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-016-0983-5"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-71249-9_6"},{"key":"ref78","first-page":"841","article-title":"Recognizing unfamiliar gestures for human-robot interaction through zero-shot learning","author":"thomason","year":"2016","journal-title":"Proc Int Symp Exp Robot"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2018.8545869"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995627"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.313"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.321"},{"key":"ref63","first-page":"4247","article-title":"Predicting deep zero-shot convolutional neural networks using textual descriptions","author":"lei ba","year":"2015","journal-title":"Proc IEEE Int Conf Comput Vis"},{"key":"ref64","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10605-2_38"},{"key":"ref65","first-page":"2152","article-title":"An embarrassingly simple approach to zero-shot learning","author":"romera-paredes","year":"2015","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.117"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.247"},{"key":"ref68","first-page":"3111","article-title":"Distributed representations of words and phrases and their compositionality","author":"mikolov","year":"2013","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1093\/deafed\/eni001"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1162"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-46616-9_10"},{"key":"ref95","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2929257"},{"key":"ref94","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1179"},{"key":"ref93","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref92","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2005.06.042"},{"key":"ref105","first-page":"1","article-title":"Auto-encoding variational bayes","author":"kingma","year":"2014","journal-title":"Proc Int Conf Learn Representations"},{"key":"ref91","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"ref104","first-page":"214","article-title":"Wasserstein generative adversarial networks","author":"arjovsky","year":"2017","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref90","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.502"},{"key":"ref103","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58542-6_29"},{"key":"ref102","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00581"},{"key":"ref98","doi-asserted-by":"publisher","DOI":"10.1109\/TGRS.2017.2754648"},{"key":"ref99","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.473"},{"key":"ref96","first-page":"5998","article-title":"Attention is all you need","author":"vaswani","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref97","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-010-5198-3"},{"key":"ref10","first-page":"1","article-title":"Sign language production using neural machine translation and generative adversarial networks","author":"stoll","year":"2018","journal-title":"Proc Brit Mach Vis Conf"},{"key":"ref11","first-page":"233","author":"lewis","year":"2015","journal-title":"Ethnologue Languages of the World"},{"key":"ref12","author":"valli","year":"2006","journal-title":"The Gallaudet Dictionary of American Sign Language"},{"key":"ref13","author":"brien","year":"1992","journal-title":"Dictionary of British Sign Language English"},{"key":"ref14","author":"johnston","year":"1998","journal-title":"Signs of Australia A New Dictionary of Auslan (Australian Sign Language)"},{"key":"ref15","first-page":"1","article-title":"MS-ASL: A large-scale data set and benchmark for understanding american sign language","author":"vaezi joze","year":"2019","journal-title":"Proc Brit Mach Vis Conf"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00718"},{"key":"ref82","first-page":"261","article-title":"Explaining models by propagating shapley values of local components","author":"chen","year":"2019","journal-title":"Proc AAAI Conf Artif Intell"},{"key":"ref17","first-page":"1","article-title":"Zero-shot sign language recognition: Can textual data uncover sign languages?","author":"bilge","year":"2019","journal-title":"Proc Brit Mach Vis Conf"},{"key":"ref81","first-page":"4768","article-title":"A unified approach to interpreting model predictions","author":"lundberg","year":"2017","journal-title":"Proc 31st Int Conf Neural Inf Process Syst"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1016\/0031-3203(88)90048-9"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01261-8_32"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/2897735"},{"key":"ref83","first-page":"618","article-title":"Grad-CAM: Why did you say that? Visual explanations from deep networks via gradient-based localization","author":"selvaraju","year":"2017","journal-title":"Proc IEEE Int Conf Comput Vis"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939778"},{"key":"ref89","author":"lucas","year":"2003","journal-title":"What&#x2019;s Your Sign for Pizza? An Introduction to Variation in American Sign Language"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2020.2975980"},{"key":"ref86","author":"costello","year":"1999","journal-title":"Random House Webster's Concise American Sign Language Dictionary"},{"key":"ref87","author":"tennant","year":"1998","journal-title":"The American Sign Language Handshape Dictionary"},{"key":"ref88","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.328"}],"container-title":["IEEE Transactions on Pattern Analysis and Machine Intelligence"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/34\/9970415\/09681230.pdf?arnumber=9681230","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,26]],"date-time":"2022-12-26T19:13:38Z","timestamp":1672082018000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9681230\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,1,1]]},"references-count":105,"journal-issue":{"issue":"1"},"URL":"https:\/\/doi.org\/10.1109\/tpami.2022.3143074","relation":{},"ISSN":["0162-8828","2160-9292","1939-3539"],"issn-type":[{"value":"0162-8828","type":"print"},{"value":"2160-9292","type":"electronic"},{"value":"1939-3539","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,1,1]]}}}