{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,14]],"date-time":"2026-02-14T10:20:11Z","timestamp":1771064411349,"version":"3.50.1"},"reference-count":49,"publisher":"Informa UK Limited","issue":"2","license":[{"start":{"date-parts":[[2023,1,10]],"date-time":"2023-01-10T00:00:00Z","timestamp":1673308800000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"the National Geological Big Data Aggregation and Management","award":["DD20190381"],"award-info":[{"award-number":["DD20190381"]}]}],"content-domain":{"domain":["www.tandfonline.com"],"crossmark-restriction":true},"short-container-title":["Annals of GIS"],"published-print":{"date-parts":[[2023,4,3]]},"DOI":"10.1080\/19475683.2023.2165543","type":"journal-article","created":{"date-parts":[[2023,1,10]],"date-time":"2023-01-10T13:38:28Z","timestamp":1673357908000},"page":"293-306","update-policy":"https:\/\/doi.org\/10.1080\/tandf_crossmark_01","source":"Crossref","is-referenced-by-count":14,"title":["A Levenshtein distance-based method for word segmentation in corpus augmentation of geoscience texts"],"prefix":"10.1080","volume":"29","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6643-4053","authenticated-orcid":false,"given":"Jinqu","family":"Zhang","sequence":"first","affiliation":[{"name":"School of Computer Science, South China Normal University, Guangzhou, China"}]},{"given":"Lang","family":"Qian","sequence":"additional","affiliation":[{"name":"School of Computer Science, South China Normal University, Guangzhou, China"}]},{"given":"Shu","family":"Wang","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Resources and Environmental Information System, Institute of Geographic Sciences and Natural Resources Research, Chinese Academy of Sciences, Beijing, China"}]},{"given":"Yunqiang","family":"Zhu","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Resources and Environmental Information System, Institute of Geographic Sciences and Natural Resources Research, Chinese Academy of Sciences, Beijing, China"},{"name":"Jiangsu Center for Collaborative Innovation in Geographical Information Resource Development and Application, Nanjing Normal University, Nanjing, China"}]},{"given":"Zhenji","family":"Gao","sequence":"additional","affiliation":[{"name":"Technology Innovation Center of Geological Information of Ministry of Natural Resources, China Geological Survey, Beijing, China"},{"name":"Geological Information Center, Development and Research Center of China Geological Survey, Beijing, China"}]},{"given":"Hailong","family":"Yu","sequence":"additional","affiliation":[{"name":"Technology Innovation Center of Geological Information of Ministry of Natural Resources, China Geological Survey, Beijing, China"},{"name":"Geological Information Center, Development and Research Center of China Geological Survey, Beijing, China"}]},{"given":"Weirong","family":"Li","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Resources and Environmental Information System, Institute of Geographic Sciences and Natural Resources Research, Chinese Academy of Sciences, Beijing, China"}]}],"member":"301","published-online":{"date-parts":[[2023,1,10]]},"reference":[{"key":"e_1_3_4_2_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jocs.2017.11.011"},{"key":"e_1_3_4_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/TNN.2007.912312"},{"key":"e_1_3_4_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/72.279181"},{"key":"e_1_3_4_5_1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/P15-1168"},{"key":"e_1_3_4_6_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D15-1141"},{"key":"e_1_3_4_7_1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1179"},{"key":"e_1_3_4_8_1","first-page":"2493","article-title":"Natural Language Processing (Almost) from Scratch","volume":"12","author":"Collobert R.","year":"2011","unstructured":"Collobert, R., J. Weston, L. Bottou, M. Karlen, K. Kavukcuoglu, and P. Kuksa. 2011. \u201cNatural Language Processing (Almost) from Scratch.\u201d Journal of Machine Learning Research 12: 2493\u20132537.","journal-title":"Journal of Machine Learning Research"},{"key":"e_1_3_4_9_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19-1423"},{"key":"e_1_3_4_10_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.488"},{"key":"e_1_3_4_11_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P17-2090"},{"key":"e_1_3_4_12_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.findings-acl.84"},{"key":"e_1_3_4_13_1","doi-asserted-by":"publisher","DOI":"10.4028\/scientific.net\/AMR.926-930.3368"},{"key":"e_1_3_4_14_1","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1901.05287"},{"key":"e_1_3_4_15_1","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1308.0850"},{"key":"e_1_3_4_16_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2021.114769"},{"key":"e_1_3_4_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/ECTICON.2008.4600388"},{"key":"e_1_3_4_18_1","first-page":"184","volume-title":"Proceedings of the Eighth International Joint Conference on Natural Language Processing","volume":"1","author":"Huang S.","year":"2017","unstructured":"Huang, S., X. Sun, and H. Wang. 2017. \u201cAddressing Domain Adaptation for Chinese Word Segmentation with Global Recurrent Structure.\u201d Proceedings of the Eighth International Joint Conference on Natural Language Processing, Taipei, Taiwan. 1. Asian Federation of Natural Language Processing. 184\u2013193."},{"key":"e_1_3_4_19_1","doi-asserted-by":"publisher","DOI":"10.1080\/19475683.2019.1675760"},{"key":"e_1_3_4_20_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-13-6861-5_47"},{"key":"e_1_3_4_21_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-2072"},{"key":"e_1_3_4_22_1","first-page":"282","volume-title":"Proceedings of the 18th International Conference on Machine Learning 2001 (ICML 2001)","author":"Lafferty J.","year":"2001","unstructured":"Lafferty, J., A. McCallum, and C. N. P. Fernando 2001. \u201cConditional Random Fields: Probabilistic Models for Segmenting and Labeling Sequence Data.\u201d Proceedings of the 18th International Conference on Machine Learning 2001 (ICML 2001).\u201c Williamstown, Massachusetts. Morgan Kaufmann Publishers Inc. 282\u2013289."},{"key":"e_1_3_4_23_1","doi-asserted-by":"publisher","DOI":"10.1136\/amiajnl-2013-002381"},{"key":"e_1_3_4_24_1","first-page":"707","article-title":"Binary Codes Capable of Correcting Deletions, Insertions and Reversals","volume":"10","author":"Levenshtein V. I.","year":"1966","unstructured":"Levenshtein, V. I. 1966. \u201cBinary Codes Capable of Correcting Deletions, Insertions and Reversals.\u201d Soviet Physics Doklady 10: 707\u2013710.","journal-title":"Soviet Physics Doklady"},{"key":"e_1_3_4_25_1","volume-title":"Proceedings of the Fourth SIGHAN Workshop on Chinese Language Processing","author":"Low J. K.","year":"2005","unstructured":"Low, J. K., Ng, H. T., and Guo, W. 2005. \u201cA Maximum Entropy Approach to Chinese Word Segmentation.\u201d Proceedings of the Fourth SIGHAN Workshop on Chinese Language Processing. https:\/\/aclanthology.org\/I05-3025"},{"key":"e_1_3_4_26_1","doi-asserted-by":"publisher","DOI":"10.1007\/s12145-021-00695-2"},{"key":"e_1_3_4_27_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i15.17611"},{"key":"e_1_3_4_28_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-1202"},{"key":"e_1_3_4_29_1","doi-asserted-by":"crossref","unstructured":"Phreeraphattanakarn T. and B. Kijsirikul. 2021. \u201cText Data-Augmentation Using Text Similarity with Manhattan Siamese Long Short-Term Memory for Thai Language.\u201d Journal of Physics: Conference Series. IOP Publishing: pp: 012018.","DOI":"10.1088\/1742-6596\/1780\/1\/012018"},{"key":"e_1_3_4_30_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cageo.2018.08.006"},{"key":"e_1_3_4_31_1","doi-asserted-by":"publisher","DOI":"10.1029\/2019EA000993"},{"key":"e_1_3_4_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/TNB.2019.2908678"},{"key":"e_1_3_4_33_1","doi-asserted-by":"publisher","DOI":"10.1145\/3357384.3358040"},{"key":"e_1_3_4_34_1","first-page":"86","volume-title":"Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics","volume":"1","author":"Sennrich R.","year":"2015","unstructured":"Sennrich, R., B. Haddow, and A. Birch. 2015. \u201cImproving Neural Machine Translation Models with Monolingual Data.\u201c Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics, Berlin, Germany. 1. Association for Computational Linguistics. 86\u201396."},{"key":"e_1_3_4_35_1","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1909.10649"},{"key":"e_1_3_4_36_1","unstructured":"Vaswani A. N. Shazeer N. Parmar J. Uszkoreit L. Jones A. N. Gomez \u0141. Kaiser and I. Polosukhin. 2017. \u201cAttention is All You Need.\u201d Advances in neural information processing systems. pp: 5998\u20136008."},{"key":"e_1_3_4_37_1","first-page":"87","article-title":"Deep Learning-Based Text Segmentation in NLP Using Fast Recurrent Neural Network with Bi-LSTM","volume":"38","author":"Vinotheni C.","year":"2021","unstructured":"Vinotheni, C., and S. LakshmanaPandian. 2021. \u201cDeep Learning-Based Text Segmentation in NLP Using Fast Recurrent Neural Network with Bi-LSTM.\u201d Smart Intelligent Computing and Communication Technology 38. 87\u201393. Advances in Parallel Computing.","journal-title":"Smart Intelligent Computing and Communication Technology"},{"key":"e_1_3_4_38_1","first-page":"163","volume-title":"Proceedings of the Eighth International Joint Conference on Natural Language Processing","author":"Wang C.","year":"2017","unstructured":"Wang, C., and B. Xu. 2017. \u201cConvolutional Neural Network with Word Embeddings for Chinese Word Segmentation.\u201c Proceedings of the Eighth International Joint Conference on Natural Language Processing, Taipei, Taiwan. Asian Federation of Natural Language Processing. 163\u2013172."},{"key":"e_1_3_4_39_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.434"},{"key":"e_1_3_4_40_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1670"},{"key":"e_1_3_4_41_1","first-page":"1812","article-title":"Clinical Named Entity Recognition Using Deep Learning Models","volume":"2017","author":"Wu Y.","year":"2018","unstructured":"Wu, Y., M. Jiang, J. Xu, D. Zhi, and H. Xu. 2018. \u201cClinical Named Entity Recognition Using Deep Learning Models.\u201d AMIA Annual Symposium Proceedings \/ AMIA Symposium AMIA Symposium 2017. 1812\u20131819. 2017.","journal-title":"AMIA Annual Symposium Proceedings \/ AMIA Symposium AMIA Symposium"},{"issue":"1","key":"e_1_3_4_42_1","first-page":"29","article-title":"Chinese Word Segmentation as Character Tagging","volume":"8","author":"Xue N. W.","year":"2003","unstructured":"Xue, N. W. 2003. \u201cChinese Word Segmentation as Character Tagging.\u201d Computational Linguistics and Chinese Language Processing 8 (1): 29\u201347.","journal-title":"Computational Linguistics and Chinese Language Processing"},{"key":"e_1_3_4_43_1","doi-asserted-by":"publisher","DOI":"10.3115\/1118824.1118839"},{"key":"e_1_3_4_44_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46681-1_42"},{"key":"e_1_3_4_45_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.jbi.2016.02.011"},{"issue":"2","key":"e_1_3_4_46_1","first-page":"343","article-title":"Geological Entity Recognition Method Based on Deep Belief Networks","volume":"34","author":"Zhang X.","year":"2018","unstructured":"Zhang, X., Y. Peng, S. Wang, and M. Du. 2018. \u201cGeological Entity Recognition Method Based on Deep Belief Networks.\u201d Acta Petrologica Sinica 34 (2): 343\u2013351.","journal-title":"Acta Petrologica Sinica"},{"key":"e_1_3_4_47_1","first-page":"158","volume-title":"Proceedings of the Fifth SIGHAN Workshop on Chinese Language Processing","author":"Zhang S.","year":"2006","unstructured":"Zhang, S., Y. Qin, J. Wen, and X. Wang. 2006. \u201cWord Segmentation and Named Entity Recognition for Sighan Bakeoff3.\u201d Proceedings of the Fifth SIGHAN Workshop on Chinese Language Processing, Sydney, Australia. Association for Computational Linguistics. 158\u2013161."},{"key":"e_1_3_4_48_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.691"},{"issue":"6","key":"e_1_3_4_49_1","first-page":"1528","article-title":"A New Chinese Word Segmentation Method Based on Maximum Matching","volume":"9","author":"Zhao Y.","year":"2018","unstructured":"Zhao, Y., H. Li, S. Yin, and Y. Sun. 2018. \u201cA New Chinese Word Segmentation Method Based on Maximum Matching.\u201d Journal of Information Hiding and Multimedia Signal Processing 9 (6): 1528\u20131535.","journal-title":"Journal of Information Hiding and Multimedia Signal Processing"},{"key":"e_1_3_4_50_1","doi-asserted-by":"publisher","DOI":"10.1080\/19475683.2019.1670735"}],"container-title":["Annals of GIS"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.tandfonline.com\/doi\/pdf\/10.1080\/19475683.2023.2165543","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,10,13]],"date-time":"2023-10-13T12:42:59Z","timestamp":1697200979000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.tandfonline.com\/doi\/full\/10.1080\/19475683.2023.2165543"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,1,10]]},"references-count":49,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2023,4,3]]}},"alternative-id":["10.1080\/19475683.2023.2165543"],"URL":"https:\/\/doi.org\/10.1080\/19475683.2023.2165543","relation":{},"ISSN":["1947-5683","1947-5691"],"issn-type":[{"value":"1947-5683","type":"print"},{"value":"1947-5691","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,1,10]]},"assertion":[{"value":"The publishing and review policy for this title is described in its Aims & Scope.","order":1,"name":"peerreview_statement","label":"Peer Review Statement"},{"value":"http:\/\/www.tandfonline.com\/action\/journalInformation?show=aimsScope&journalCode=tagi20","URL":"http:\/\/www.tandfonline.com\/action\/journalInformation?show=aimsScope&journalCode=tagi20","order":2,"name":"aims_and_scope_url","label":"Aim & Scope"},{"value":"2021-08-05","order":0,"name":"received","label":"Received","group":{"name":"publication_history","label":"Publication History"}},{"value":"2023-01-02","order":1,"name":"accepted","label":"Accepted","group":{"name":"publication_history","label":"Publication History"}},{"value":"2023-01-10","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}