{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,27]],"date-time":"2026-03-27T17:11:20Z","timestamp":1774631480642,"version":"3.50.1"},"reference-count":42,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2021,6,4]],"date-time":"2021-06-04T00:00:00Z","timestamp":1622764800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,6,4]],"date-time":"2021-06-04T00:00:00Z","timestamp":1622764800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001409","name":"Department of Science and Technology, Ministry of Science and Technology","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001409","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Speech Technol"],"published-print":{"date-parts":[[2021,12]]},"DOI":"10.1007\/s10772-021-09860-w","type":"journal-article","created":{"date-parts":[[2021,6,4]],"date-time":"2021-06-04T11:03:10Z","timestamp":1622804590000},"page":"853-864","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":39,"title":["Part-of-speech (POS) tagging using conditional random field (CRF) model for Khasi corpora"],"prefix":"10.1007","volume":"24","author":[{"given":"Sunita","family":"Warjri","sequence":"first","affiliation":[]},{"given":"Partha","family":"Pakray","sequence":"additional","affiliation":[]},{"given":"Saralin A.","family":"Lyngdoh","sequence":"additional","affiliation":[]},{"given":"Arnab Kumar","family":"Maji","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,6,4]]},"reference":[{"key":"9860_CR1","unstructured":"Agarwal, H., & Mani, A. (2006). Part of speech tagging and chunking with conditional random fields. In the Proceedings of NWAI workshop."},{"issue":"3","key":"9860_CR2","first-page":"3","volume":"3","author":"A Ahmad","year":"2014","unstructured":"Ahmad, A., & Syam, B. (2014). Kashmir part of speech tagger using CRF. Computer Science, 3(3), 3.","journal-title":"Computer Science"},{"key":"9860_CR3","doi-asserted-by":"publisher","unstructured":"Barman, A. K., Sarmah, J., & Sarma, S. K. (2013). POS Tagging of Assamese language and performance analysis of CRF++ and fnTBL approaches. In: 2013 UKSim 15th international conference on computer modelling and simulation IEEE, pp. 476\u2013479. Retrieved from https:\/\/doi.org\/10.1109\/UKSim.2013.91.","DOI":"10.1109\/UKSim.2013.91"},{"issue":"1","key":"9860_CR4","first-page":"18","volume":"17","author":"P Behera","year":"2017","unstructured":"Behera, P. (2017). An experiment with the CRF++ parts of speech (POS) tagger for Odia. Language in India, 17(1), 18.","journal-title":"Language in India"},{"key":"9860_CR5","doi-asserted-by":"publisher","unstructured":"Brants, T. (2000). TnT: A statistical part-of-speech tagger. Sixth Applied Natural Language Processing Conference (Association for Computational Linguistics, Seattle, Washington, USA), (pp. 224\u2013231). https:\/\/doi.org\/10.3115\/974147.974178.","DOI":"10.3115\/974147.974178"},{"issue":"17","key":"9860_CR6","doi-asserted-by":"publisher","first-page":"26","DOI":"10.5120\/7442-0452","volume":"48","author":"S Br","year":"2012","unstructured":"Br, S., & Ramakanth Kumar, P. (2012). Kannada part-of-speech tagging with probabilistic classifiers. International Journal of Computer Applications, 48(17), 26.","journal-title":"International Journal of Computer Applications"},{"key":"9860_CR7","unstructured":"CLE. (2020). Center for language engineering. Retrieved January 12, 2020, from https:\/\/www.cle.org.pk\/"},{"key":"9860_CR8","doi-asserted-by":"publisher","first-page":"133","DOI":"10.3115\/974499.974523","volume":"6","author":"D Cutting","year":"1992","unstructured":"Cutting, D., Kupiec, J., Pedersen, J., & Sibun, P. (1992). A practical part-of-speech tagger. Third Conference on Applied Natural Language Processing, 6, 133\u2013140.","journal-title":"Third Conference on Applied Natural Language Processing"},{"key":"9860_CR9","unstructured":"Ekbal, A., Haque, R., & Bandyopadhyay, S. (2007). Bengali part of speech tagging using conditional random field. In Proceedings of seventh international symposium on natural language processing (SNLP2007), (pp. 131\u2013136)."},{"key":"9860_CR10","first-page":"2938","volume":"2","author":"B Jawaid","year":"2014","unstructured":"Jawaid, B., Kamran, A., & Bojar, O. (2014). A tagged corpus and a tagger for Urdu. LREC, 2, 2938\u20132943.","journal-title":"LREC"},{"issue":"3","key":"9860_CR11","doi-asserted-by":"publisher","first-page":"331","DOI":"10.1007\/s10579-018-9439-6","volume":"53","author":"W Khan","year":"2019","unstructured":"Khan, W., Daud, A., Nasir, J. A., Amjad, T., Arafat, S., Aljohani, N., et al. (2019). Urdu part of speech tagging using conditional random fields. Language Resources and Evaluation, 53(3), 331.","journal-title":"Language Resources and Evaluation"},{"key":"9860_CR12","doi-asserted-by":"publisher","unstructured":"Krishnapriya, V., Sreesha, P., Harithalakshmi, T., Archana, T., & Vettath, J. N. (2014). Design of a POS tagger using conditional random fields for Malayalam. In 2014 first international conference on computational systems and communications (ICCSC) IEEE, (pp. 370\u2013373). https:\/\/doi.org\/10.1109\/COMPSC.2014.7032680.","DOI":"10.1109\/COMPSC.2014.7032680"},{"key":"9860_CR13","unstructured":"Lafferty, J., McCallum, A., & Pereira, F. C. (2001). Conditional random fields: Probabilistic models for segmenting and labeling sequence data. In proceedings of the eighteenth international conference on machine learning, (pp. 282\u2013289)"},{"key":"9860_CR14","unstructured":"Mawphor. (2017). Mawphor. Retrieved November 2017, June 2019, from https:\/\/www.mawphor.com\/index.php\/"},{"issue":"2","key":"9860_CR15","first-page":"155","volume":"20","author":"B Merialdo","year":"1994","unstructured":"Merialdo, B. (1994). Tagging English text with a probabilistic model. Computational Linguistics, 20(2), 155.","journal-title":"Computational Linguistics"},{"key":"9860_CR16","unstructured":"Ojha, A. K., Behera, P., Singh, S., & Jha, G. N. (2015). Training & evaluation of pos taggers in indo-aryan languages: A case of Hindi, Odia and Bhojpuri. In the proceedings of 7th language & technology conference: human language technologies as a challenge for computer science and linguistics, (pp. 524\u2013529)."},{"key":"9860_CR17","doi-asserted-by":"publisher","unstructured":"Pallavi, K., & Pillai, A. S. (2016). Kannpos-Kannada parts of speech tagger using conditional random fields. In: Emerging research in computing, information, communication and applications. Springer (pp. 479\u2013491). Retrieved from https:\/\/doi.org\/10.1007\/978-81-322-2553-9_43.","DOI":"10.1007\/978-81-322-2553-9_43"},{"key":"9860_CR18","doi-asserted-by":"publisher","first-page":"11","DOI":"10.1007\/978-3-642-00831-3_2","volume-title":"Computer processing of oriental languages. Language technology for the knowledge-based economy","author":"SL Pandian","year":"2009","unstructured":"Pandian, S. L., & Geetha, T. V. (2009). CRF models for Tamil part of speech tagging and chunking. In W. Li & D. Moll\u00e1-Aliod (Eds.), Computer processing of oriental languages. Language technology for the knowledge-based economy (pp. 11\u201322). Berlin: Springer."},{"key":"9860_CR19","unstructured":"Patel, C., & Gali, K. (2008). Part-of-speech tagging for Gujarati using conditional random fields. In: Proceedings of the IJCNLP-08 workshop on NLP for less privileged languages. Retrieved from https:\/\/www.aclweb.org\/anthology\/I08-3019."},{"key":"9860_CR20","first-page":"21","volume":"21","author":"A Pvs","year":"2007","unstructured":"Pvs, A., & Karthik, G. (2007). Part-of-speech tagging and chunking using conditional random fields and transformation based learning. Shallow Parsing for South Asian Languages, 21, 21.","journal-title":"Shallow Parsing for South Asian Languages"},{"key":"9860_CR21","doi-asserted-by":"publisher","first-page":"14","DOI":"10.5120\/ijca2016909684","volume":"142","author":"SK Sharma","year":"2016","unstructured":"Sharma, S. K. (2016). Assigning the correct word class to Punjabi unknown words using CRF. International Journal of Computer Applications, 142, 14. https:\/\/doi.org\/10.5120\/ijca2016909684.","journal-title":"International Journal of Computer Applications"},{"key":"9860_CR22","unstructured":"Singh, T. D., & Ekbal, A. (2008). Manipuri POS tagging using CRF and SVM: A language independent approach. In proceeding of 6th international conference on natural language processing (ICON-2008), (pp. 240\u2013245)"},{"key":"9860_CR23","doi-asserted-by":"publisher","unstructured":"Suraksha, N., Reshma, K., & Kumar, K. S. (2017). Part-of-speech tagging and parsing of Kannada text using Conditional Random Fields (CRFs). In: 2017 international conference on intelligent computing and control (I2C2) IEEE, (pp. 1\u20135). Retrieved from https:\/\/doi.org\/10.1109\/I2C2.2017.8321833.","DOI":"10.1109\/I2C2.2017.8321833"},{"key":"9860_CR24","unstructured":"Tham, M. J. (2018). Challenges and Issues in Developing an Annotated Corpus and HMM POS Tagger for Khasi. In the 15th international conference on natural language processing, (pp. 10\u201319)."},{"key":"9860_CR25","unstructured":"Warjri, S. (2020). Khasi corpus. Retrieved from https:\/\/github.com\/sunitawarjri\/Khasi-Corpus\/blob\/master\/Khasi%20Corpus.txt."},{"key":"9860_CR26","doi-asserted-by":"crossref","unstructured":"Warjri, S., Pakray, P., Lyngdoh, S., & Maji, A. K. (2021). Adopting conditional random field (CRF) for Khasi part-of-speech tagging (KPOST). In proceedings of the international conference on computing and communication systems: I3CS 2020, NEHU, Shillong, India, vol. 170 (Springer Nature), vol. 170, p. 75.","DOI":"10.1007\/978-981-33-4084-8_8"},{"issue":"1","key":"9860_CR27","first-page":"109","volume":"1","author":"S Warjri","year":"2018","unstructured":"Warjri, S., Pakray, P., Lyngdoh, S., & Kumar Maji, A. (2018). Khasi language as dominant part-of-speech (POS) ascendant in NLP. International Journal of Computational Intelligence & IoT, 1(1), 109.","journal-title":"International Journal of Computational Intelligence & IoT"},{"issue":"3","key":"9860_CR28","doi-asserted-by":"publisher","first-page":"795","DOI":"10.13053\/CyS-23-3-3248","volume":"23","author":"S Warjri","year":"2019","unstructured":"Warjri, S., Pakray, P., Lyngdoh, S., & Maji, A. K. (2019). Identification of POS Tag for Khasi Language based on Hidden Markov Model POS Tagger. Computaci\u00f3n y Sistemas, 23(3), 795. https:\/\/doi.org\/10.13053\/CyS-23-3-3248.","journal-title":"Computaci\u00f3n y Sistemas"},{"key":"9860_CR29","unstructured":"Wikipedia contributors. (2020a). Bengali language: Wikipedia, the free encyclopedia. Retrieved February 02, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Bengali-language&oldid=941772762."},{"key":"9860_CR30","unstructured":"Wikipedia contributors. (2020b). Assamese language: Wikipedia, the free encyclopedia. Retrieved February 02, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Assamese-language&oldid=939154061."},{"key":"9860_CR31","unstructured":"Wikipedia contributors. (2020c). Gujarati language: Wikipedia, the free encyclopedia. Retrieved February 03, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Gujarati-language&oldid=942374083"},{"key":"9860_CR32","unstructured":"Wikipedia contributors. (2020d). Kannada: Wikipedia, the free encyclopedia. Retrieved February 05, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Kannada&oldid=942703407."},{"key":"9860_CR33","unstructured":"Wikipedia contributors. (2020e). Kashmiri language: Wikipedia, the free encyclopedia. Retrieved February 04, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Kashmiri-language&oldid=942627183."},{"key":"9860_CR34","unstructured":"Wikipedia contributors. (2020f). Malayalam: Wikipedia, the free encyclopedia. Retrieved February 03, 2020 from https:\/\/en.wikipedia.org\/w\/index.php?title=Malayalam&oldid=941882964"},{"key":"9860_CR35","unstructured":"Wikipedia contributors. (2020g). Meitei language: Wikipedia, the free encyclopedia. Retrieved February 02, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Meitei-language&oldid=936096557"},{"key":"9860_CR36","unstructured":"Wikipedia contributors. (2020h). Odia language: Wikipedia, the free encyclopedia. Retrieved February 03, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Odia-language&oldid=941768688"},{"key":"9860_CR37","unstructured":"Wikipedia contributors. (2020i). Punjabi language: Wikipedia, the free encyclopedia. Retrieved February 02, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Punjabi-language&oldid=941520253"},{"key":"9860_CR38","unstructured":"Wikipedia contributors. (2020j). Tamil language: Wikipedia, the free encyclopedia. Retrieved February 04, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Tamil_language&oldid=941234813"},{"key":"9860_CR39","unstructured":"Wikipedia contributors. (2020k). Hindi: Wikipedia, the free encyclopedia. Retrieved February 03, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Hindi&oldid=942598408."},{"key":"9860_CR40","unstructured":"Wikipedia contributors. (2020l). Urdu: Wikipedia, the free encyclopedia. Retrieved February 02, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Urdu&oldid=942705946"},{"key":"9860_CR41","unstructured":"Wikipedia contributors. (2020m). Khasi: Wikipedia, the free encyclopedia. Retrieved January 15, 2020, from https:\/\/en.wikipedia.org\/w\/index.php?title=Khasi_language&oldid=914412473"},{"issue":"3","key":"9860_CR42","first-page":"1169","volume":"4","author":"C Zhang","year":"2008","unstructured":"Zhang, C., Wang, H., Liu, Y., Wu, D., Liao, Y., & Wang, B. (2008). Automatic keyword extraction from documents using conditional random fields. Journal of Computational Information Systems, 4(3), 1169.","journal-title":"Journal of Computational Information Systems"}],"container-title":["International Journal of Speech Technology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-021-09860-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10772-021-09860-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-021-09860-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,11,18]],"date-time":"2021-11-18T10:17:13Z","timestamp":1637230633000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10772-021-09860-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,6,4]]},"references-count":42,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2021,12]]}},"alternative-id":["9860"],"URL":"https:\/\/doi.org\/10.1007\/s10772-021-09860-w","relation":{},"ISSN":["1381-2416","1572-8110"],"issn-type":[{"value":"1381-2416","type":"print"},{"value":"1572-8110","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,6,4]]},"assertion":[{"value":"1 October 2020","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 May 2021","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 June 2021","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}