{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,29]],"date-time":"2025-08-29T17:40:08Z","timestamp":1756489208144,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":22,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,4,18]],"date-time":"2024-04-18T00:00:00Z","timestamp":1713398400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,4,18]]},"DOI":"10.1145\/3603287.3651197","type":"proceedings-article","created":{"date-parts":[[2024,4,27]],"date-time":"2024-04-27T12:06:34Z","timestamp":1714219594000},"page":"278-283","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Toshakhana: A Multidimensional Panjabi Corpus in Gurmukhi Script"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-9222-8458","authenticated-orcid":false,"given":"Arvinder","family":"Kang","sequence":"first","affiliation":[{"name":"University of Mississippi, Oxford, Mississippi, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9632-6870","authenticated-orcid":false,"given":"Thai","family":"Le","sequence":"additional","affiliation":[{"name":"University of Mississippi, Oxford, Mississippi, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7645-674X","authenticated-orcid":false,"given":"Yixin","family":"Chen","sequence":"additional","affiliation":[{"name":"University of Mississippi, Oxford, Mississippi, USA"}]}],"member":"320","published-online":{"date-parts":[[2024,4,27]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"2017. Jagbani. https:\/\/jagbani.punjabkesari.in\/"},{"key":"e_1_3_2_1_2_1","unstructured":"2020. Punjabi-kavita.com. 
https:\/\/www.punjabi-kavita.com\/"},{"key":"e_1_3_2_1_3_1","unstructured":"2022. Ajitjalandhar.com. https:\/\/www.ajitjalandhar.com\/"},{"key":"e_1_3_2_1_4_1","unstructured":"2022. Punjabitribuneonline.com. https:\/\/www.punjabitribuneonline.com\/"},{"key":"e_1_3_2_1_5_1","volume-title":"Corpus Linguistics","author":"Baker Paul","year":"2003","unstructured":"Paul Baker, Andrew Hardie, Tony McEnery, and BD Jayaram. 2003. Constructing Corpora of South Asian Languages. In Corpus Linguistics 2003. Lancaster, UK."},{"key":"e_1_3_2_1_6_1","volume-title":"Punjabi: A Cognitive-descriptive Grammar","author":"Bhatia Tej K.","year":"1993","unstructured":"Tej K. Bhatia. 1993. Punjabi: A Cognitive-descriptive Grammar. Routledge, New York."},{"key":"e_1_3_2_1_7_1","unstructured":"Kulpreet Chilana. 2017. Punjabi Dictionary. https:\/\/apps.apple.com\/in\/app\/punjabi-dictionary\/id550017294"},{"volume-title":"South Asian Folklore: An Encyclopedia: Afghanistan","author":"Claus Peter J.","key":"e_1_3_2_1_8_1","unstructured":"Peter J. Claus. 2003. South Asian Folklore: An Encyclopedia: Afghanistan. Vol. 1. Routledge, New York."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1080\/09739572.2017.1324385"},{"volume-title":"Linguistic Survey of India","author":"Grierson George Abraham","key":"e_1_3_2_1_10_1","unstructured":"George Abraham Grierson. 1916. Linguistic Survey of India. Vol. 9. Supt. Govt. Printing India, Calcutta. 607--806 pages."},{"key":"e_1_3_2_1_11_1","volume-title":"Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10)","author":"Jha Girish Nath","year":"2010","unstructured":"Girish Nath Jha. 2010. The TDIL Program and the Indian Language Corpora Initiative (ILCI). In Proceedings of the Seventh International Conference on Language Resources and Evaluation (LREC'10). European Language Resources Association (ELRA), Valletta, Malta. 
http:\/\/www.lrec-conf.org\/proceedings\/lrec2010\/pdf\/874_Paper.pdf"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-32-9949-8_26"},{"volume-title":"The Making of Sikh Scripture","author":"Mann Gurinder Singh","key":"e_1_3_2_1_13_1","unstructured":"Gurinder Singh Mann. 2001. The Making of Sikh Scripture. Oxford University Press, New York."},{"key":"e_1_3_2_1_14_1","unstructured":"Central Institute of Indian Languages. 2019. A Gold Standard Punjabi Raw Text Corpus. https:\/\/data.ldcil.org\/a-gold-standard-punjabi-raw-text-corpus?search=punjabi&category_id=0"},{"key":"e_1_3_2_1_15_1","unstructured":"BBC News Punjabi. 2022. BBC News Punjabi. https:\/\/www.bbc.com\/punjabi"},{"volume-title":"The Indo-Aryan languages","author":"Shackle Christopher","key":"e_1_3_2_1_16_1","unstructured":"Christopher Shackle. 2003. The Indo-Aryan languages. Routledge, London, New York. 581--621 pages."},{"key":"e_1_3_2_1_17_1","volume-title":"The Language Divide in Punjab. South Asian Graduate Research Journal 4, 1","author":"Singh Atamjit","year":"1997","unstructured":"Atamjit Singh. 1997. The Language Divide in Punjab. South Asian Graduate Research Journal 4, 1 (1997)."},{"key":"e_1_3_2_1_18_1","unstructured":"Kulbir S. Thind. 2005. Unicode Gurmukhi Fonts and Information. https:\/\/www.gurbanifiles.net\/unicode\/index.htm"},{"key":"e_1_3_2_1_19_1","unstructured":"Kulbir S. Thind. 2006--03. Issues Regarding the Use of Unicode Gurmukhi fonts. https:\/\/www.gurbanifiles.net\/unicode\/unicode_issues.htm"},{"key":"e_1_3_2_1_20_1","unstructured":"Vibhijain. 2011. Countries Where Punjabi is Spoken. Wikimedia Commons. https:\/\/commons.wikimedia.org\/wiki\/File:Countries_where_Punjabi_is_spoken.png"},{"key":"e_1_3_2_1_21_1","unstructured":"Emma Williams. 2008--09. A Comparative Study of the Development of the Gurumukhi Script: From the Handwritten Manuscript to the Digital Typeface."},{"key":"e_1_3_2_1_22_1","unstructured":"WorldData. 2022. 
Geographical Distribution of Languages Worldwide. WorldData. https:\/\/www.worlddata.info\/languages\/index.php"}],"event":{"name":"ACM SE '24: 2024 ACM Southeast Conference","sponsor":["ACM Association for Computing Machinery"],"location":"Marietta GA USA","acronym":"ACM SE '24"},"container-title":["Proceedings of the 2024 ACM Southeast Conference"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3603287.3651197","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3603287.3651197","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,29]],"date-time":"2025-08-29T17:06:17Z","timestamp":1756487177000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3603287.3651197"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,18]]},"references-count":22,"alternative-id":["10.1145\/3603287.3651197","10.1145\/3603287"],"URL":"https:\/\/doi.org\/10.1145\/3603287.3651197","relation":{},"subject":[],"published":{"date-parts":[[2024,4,18]]},"assertion":[{"value":"2024-04-27","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}