{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T11:36:49Z","timestamp":1725536209747},"publisher-location":"Berlin, Heidelberg","reference-count":20,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642030390"},{"type":"electronic","value":"9783642030406"}],"license":[{"start":{"date-parts":[[2009,1,1]],"date-time":"2009-01-01T00:00:00Z","timestamp":1230768000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2009]]},"DOI":"10.1007\/978-3-642-03040-6_78","type":"book-chapter","created":{"date-parts":[[2009,7,30]],"date-time":"2009-07-30T08:16:37Z","timestamp":1248941797000},"page":"639-646","source":"Crossref","is-referenced-by-count":1,"title":["An Automatic Intelligent Language Classifier"],"prefix":"10.1007","author":[{"given":"Brijesh","family":"Verma","sequence":"first","affiliation":[]},{"given":"Hong","family":"Lee","sequence":"additional","affiliation":[]},{"given":"John","family":"Zakos","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"doi-asserted-by":"crossref","unstructured":"Artemenko, O., Mandl, T., Shramko, M., Womser-Hacker, C.: Evaluation of a language identification system for mono- and multilingual text documents. In: Proceedings of the 2006 ACM symposium on applied computing, pp. 859\u2013860 (2006)","key":"78_CR1","DOI":"10.1145\/1141277.1141473"},{"unstructured":"Dunning, T.: Statistical identification of language, Technical report CRL MCCS-94-273, New Mexico State University, Computing Research Lab (March 1994)","key":"78_CR2"},{"doi-asserted-by":"crossref","unstructured":"Hakkinen, J., Tian, J.: N-gram and decision tree based language identification for written words. In: IEEE workshop on automatic speech recognition and understanding (ASRU 2001), pp. 335\u2013338 (2001)","key":"78_CR3","DOI":"10.1109\/ASRU.2001.1034655"},{"doi-asserted-by":"crossref","unstructured":"Lins, R., Goncalves, P.: Automatic language identification of written texts. In: Proceedings of the 2004 ACM symposium on applied computing, pp. 1128\u20131133 (2004)","key":"78_CR4","DOI":"10.1145\/967900.968129"},{"issue":"5","key":"78_CR5","doi-asserted-by":"publisher","first-page":"1799","DOI":"10.1016\/j.patcog.2007.10.017","volume":"41","author":"S. Lu","year":"2008","unstructured":"Lu, S., Tan, C.L.: Retrieval of machine-printed Latin documents through word shape coding. Pattern Recognition\u00a041(5), 1799\u20131809 (2008)","journal-title":"Pattern Recognition"},{"doi-asserted-by":"crossref","unstructured":"Martins, B., Silva, M.: Language identification in web pages. In: Proceedings of the 2005 ACM symposium on applied computing, pp. 764\u2013768 (2005)","key":"78_CR6","DOI":"10.1145\/1066677.1066852"},{"issue":"3","key":"78_CR7","first-page":"94","volume":"20","author":"P. McNamee","year":"2005","unstructured":"McNamee, P.: Language identification: a solved problem suitable for undergraduate instruction. J. Comput. Small Coll.\u00a020(3), 94\u2013101 (2005)","journal-title":"J. Comput. Small Coll."},{"key":"78_CR8","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1109\/79.317925","volume":"11","author":"Y. Muthusamy","year":"1994","unstructured":"Muthusamy, Y., Barnard, E., Cole, R.: Automatic language identification: a review\/tutorial. IEEE Signal Processing\u00a011, 33\u201341 (1994)","journal-title":"IEEE Signal Processing"},{"doi-asserted-by":"crossref","unstructured":"Poutsma, A.: Applying monte carlo techniques to language identification. In: Proceedings of computational linguistics in the Netherlands (CLIN), vol.\u00a045, pp. 179\u2013189 (2001)","key":"78_CR9","DOI":"10.1163\/9789004334038_015"},{"unstructured":"Prager, J.L.: Language identification for multilingual documents. In: Proceedings of the 32nd annual Hawaii international conference on system sciences, vol.\u00a02, p. 2035 (1999)","key":"78_CR10"},{"doi-asserted-by":"crossref","unstructured":"Qu, Y., Grefenstette, G.: Finding ideographic representations of Japanese names written in Latin script via language identification and corpus validation. In: Proceedings of the 42nd annual meeting on association for computational linguistics, p. 183 (2004)","key":"78_CR11","DOI":"10.3115\/1218955.1218979"},{"issue":"9","key":"78_CR12","doi-asserted-by":"publisher","first-page":"697","DOI":"10.1016\/j.specom.2007.04.006","volume":"49","author":"H. Romsdorfer","year":"2007","unstructured":"Romsdorfer, H., Pfister, B.: Text analysis and language identification for polyglot text-to-speech synthesis. Speech communication\u00a049(9), 697\u2013724 (2007)","journal-title":"Speech communication"},{"key":"78_CR13","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1016\/j.ins.2003.03.003","volume":"158","author":"A. Selamat","year":"2004","unstructured":"Selamat, A., Omatu, S.: Web page feature selection and classification using neural networks. Information sciences\u00a0158, 69\u201388 (2004)","journal-title":"Information sciences"},{"doi-asserted-by":"crossref","unstructured":"Selamat, A., Ching, N.C., Mikami, Y.: Arabic script web documents language identification using decision tree-ARTMAP model. In: IEEE International conference on convergence information technology, pp. 721\u2013726 (2007)","key":"78_CR14","DOI":"10.1109\/ICCIT.2007.402"},{"unstructured":"The Unicode Consortium. The Unicode Standard, Version 5.0, 5th edn. Addison-Wesley Professional, Reading (2006)","key":"78_CR15"},{"unstructured":"Unicode (June 26, 2008), Wikipedia, http:\/\/en.wikipedia.org\/wiki\/Unicode (Retrieved June 27, 2008)","key":"78_CR16"},{"unstructured":"Unicode\/UTF-8-character table, UTF8-CharTable, http:\/\/www.utf8-chartable.de\/unicode-utf8-table.pl (Retrieved June 26, 2008)","key":"78_CR17"},{"unstructured":"UTF-8 (June 24, 2008). Wikipedia: http:\/\/en.wikipedia.org\/wiki\/UTF-8 (Retrieved June 26, 2008)","key":"78_CR18"},{"issue":"3","key":"78_CR19","doi-asserted-by":"publisher","first-page":"583","DOI":"10.1016\/j.patcog.2003.05.001","volume":"37","author":"A. Xafopoulos","year":"2004","unstructured":"Xafopoulos, A., Kotropoulos, C., Almpanidis, G., Pitas, I.: Language identification in web documents using discrete HMMs. Pattern recognition\u00a037(3), 583\u2013594 (2004)","journal-title":"Pattern recognition"},{"doi-asserted-by":"crossref","unstructured":"Yergeau, F.: UTF-8, a transformation format of ISO 10646. In: RFC 3629, internet engineering task force (2003)","key":"78_CR20","DOI":"10.17487\/rfc3629"}],"container-title":["Lecture Notes in Computer Science","Advances in Neuro-Information Processing"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-03040-6_78","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,5,21]],"date-time":"2019-05-21T15:44:22Z","timestamp":1558453462000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-03040-6_78"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2009]]},"ISBN":["9783642030390","9783642030406"],"references-count":20,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-03040-6_78","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2009]]}}}