{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,17]],"date-time":"2026-04-17T16:06:19Z","timestamp":1776441979385,"version":"3.51.2"},"reference-count":40,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,8,25]],"date-time":"2023-08-25T00:00:00Z","timestamp":1692921600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,8,25]],"date-time":"2023-08-25T00:00:00Z","timestamp":1692921600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,8,25]]},"DOI":"10.1109\/iciis58898.2023.10253560","type":"proceedings-article","created":{"date-parts":[[2023,9,20]],"date-time":"2023-09-20T17:37:40Z","timestamp":1695231460000},"page":"61-66","source":"Crossref","is-referenced-by-count":3,"title":["Sinhala-English Parallel Word Dictionary Dataset"],"prefix":"10.1109","author":[{"given":"Kasun","family":"Wickramasinghe","sequence":"first","affiliation":[{"name":"University of Moratuwa,Department of Computer Science &#x0026; Engineering,Moratuwa,Sri Lanka"}]},{"given":"Nisansa","family":"De Silva","sequence":"additional","affiliation":[{"name":"University of Moratuwa,Department of Computer Science &#x0026; Engineering,Moratuwa,Sri Lanka"}]}],"member":"263","reference":[{"key":"ref13","first-page":"3291","article-title":"Constraint-based bilingual lexicon induction for closely related languages","author":"nasution","year":"2016","journal-title":"LREC"},{"key":"ref35","article-title":"Im-plementing a corpus for sinhala language","author":"upeksha","year":"2015","journal-title":"Symposium on Language Technology for South Asia 2015"},{"key":"ref12","first-page":"846","article-title":"Analyzing methods for improving precision of pivot based bilingual dictionaries","author":"saralegi","year":"2011","journal-title":"EMNLP"},{"key":"ref34","article-title":"Sinhala text classification: observations from the perspective of a resource poor language","author":"de silva","year":"2015","journal-title":"ResearchGATE"},{"key":"ref15","first-page":"79","article-title":"A statistical approach to machine translation","volume":"16","author":"brown","year":"1990","journal-title":"Computational Linguistics"},{"key":"ref37","first-page":"2214","article-title":"Parallel data, tools and interfaces in OPUS","author":"tiedemann","year":"2012","journal-title":"LREC"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/2723144"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-18422-7_7"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00051"},{"key":"ref30","first-page":"20","article-title":"Ensitip: a tool to unlock the english web","author":"wasala","year":"2008","journal-title":"11 th international conference on humans and computers Nagaoka University of Technology Japan"},{"key":"ref11","first-page":"1","article-title":"Exploiting bilingual lexicons to improve multilingual embedding-based document and sentence alignment for low-resource languages","author":"fernando","year":"2022","journal-title":"Knowledge and Information Systems"},{"key":"ref33","article-title":"Improving english to sinhala neural machine translation using part-of-speech tag","author":"perera","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.62"},{"key":"ref32","article-title":"Bag of tricks for efficient text classification","author":"joulin","year":"2016","journal-title":"ArXiv Preprint"},{"key":"ref2","article-title":"A survey on recent approaches for natural language processing in low-resource scenarios","author":"hedderich","year":"2020","journal-title":"ArXiv Preprint"},{"key":"ref1","article-title":"Low-resource languages: A review of past work and future challenges","author":"magueresse","year":"2020","journal-title":"ArXiv Preprint"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W16-2369"},{"key":"ref39","first-page":"74","article-title":"Rouge: A package for automatic evaluation of summaries","author":"lin","year":"2004","journal-title":"Text Summarization Branches Out"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W16-2366"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.365"},{"key":"ref19","article-title":"Neural machine translation by jointly learning to align and translate","author":"bahdanau","year":"2014","journal-title":"ArXiv Preprint"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W16-2365"},{"key":"ref24","first-page":"100","article-title":"Building a wordnet for sinhala","author":"wijesiri","year":"2014","journal-title":"Proceedings of the Seventh Global WordNet Conference"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1162\/tacl_a_00447"},{"key":"ref26","article-title":"No language left behind: Scaling human-centered machine translation","author":"costa-juss\u00e0","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1632"},{"key":"ref20","article-title":"Google's neural machine translation system: Bridging the gap between human and machine translation","author":"wu","year":"2016","journal-title":"ArXiv Preprint"},{"key":"ref22","article-title":"Data augmentation to address out-of-vocabulary problem in low-resource sinhala-english neural machine translation","author":"fernando","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/MERCon52712.2021.9525720"},{"key":"ref28","first-page":"4555","article-title":"Paracrawl: Web-scale acquisition of parallel corpora","author":"ba\u00f1\u00f3n","year":"2020","journal-title":"ACL"},{"key":"ref27","first-page":"124","article-title":"Automatic creation of a sentence aligned sinhala-tamil parallel corpus","author":"hameed","year":"0","journal-title":"Proceedings of the 6th Workshop on South and Southeast Asian Natural Language Processing (WSSANLP2016)"},{"key":"ref29","article-title":"Tamizhi-net ocr: Creating a quality large scale tamil-sinhala-english parallel corpus using deep learning based printed charac-ter recognition (pcr)","author":"vasantharajan","year":"2021","journal-title":"ArXiv Preprint"},{"key":"ref8","article-title":"Cross-lingual language model pretraining","volume":"32","author":"conneau","year":"2019","journal-title":"NIPS"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D18-1330"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.747"},{"key":"ref4","article-title":"Survey on publicly available sinhala natural language processing tools and research","author":"de silva","year":"2019","journal-title":"ArXiv Preprint"},{"key":"ref3","article-title":"Some languages are more equal than others: Probing deeper into the linguistic disparity in the nlp world","author":"ranathunga","year":"2022","journal-title":"ArXiv Preprint"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/N15-1104"},{"key":"ref5","article-title":"Exploiting similarities among languages for machine translation","author":"mikolov","year":"2013","journal-title":"ArXiv Preprint"},{"key":"ref40","first-page":"1874","article-title":"Word embedding evaluation for sinhala","author":"lakmal","year":"2020","journal-title":"LREC"}],"event":{"name":"2023 IEEE 17th International Conference on Industrial and Information Systems (ICIIS)","location":"Peradeniya, Sri Lanka","start":{"date-parts":[[2023,8,25]]},"end":{"date-parts":[[2023,8,26]]}},"container-title":["2023 IEEE 17th International Conference on Industrial and Information Systems (ICIIS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10253467\/10253461\/10253560.pdf?arnumber=10253560","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,10,9]],"date-time":"2023-10-09T18:10:22Z","timestamp":1696875022000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10253560\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,8,25]]},"references-count":40,"URL":"https:\/\/doi.org\/10.1109\/iciis58898.2023.10253560","relation":{},"subject":[],"published":{"date-parts":[[2023,8,25]]}}}