{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T07:39:43Z","timestamp":1740123583098,"version":"3.37.3"},"reference-count":118,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2021,3,14]],"date-time":"2021-03-14T00:00:00Z","timestamp":1615680000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,3,14]],"date-time":"2021-03-14T00:00:00Z","timestamp":1615680000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Artif Intell Rev"],"published-print":{"date-parts":[[2022,2]]},"DOI":"10.1007\/s10462-021-09983-1","type":"journal-article","created":{"date-parts":[[2021,3,14]],"date-time":"2021-03-14T09:04:18Z","timestamp":1615712658000},"page":"1085-1120","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Postal address extraction from the web: a comprehensive survey"],"prefix":"10.1007","volume":"55","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8430-1000","authenticated-orcid":false,"given":"Mohammed","family":"Kayed","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sara","family":"Dakrory","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"A. A.","family":"Ali","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2021,3,14]]},"reference":[{"key":"9983_CR1","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1016\/j.compenvurbsys.2017.03.007","volume":"64","author":"E Acheson","year":"2017","unstructured":"Acheson E, De Sabbata S, Purves RS (2017) A quantitative analysis of global gazetteers: patterns of coverage for common feature types. Comput Environ Urban Syst 64:309\u2013320. https:\/\/doi.org\/10.1016\/j.compenvurbsys.2017.03.007","journal-title":"Comput Environ Urban Syst"},{"key":"9983_CR2","doi-asserted-by":"crossref","unstructured":"Ahlers D (2013, November). Assessment of the accuracy of GeoNames gazetteer data. In Proceedings of the 7th workshop on geographic information retrieval (pp. 74-81). ACM","DOI":"10.1145\/2533888.2533938"},{"key":"9983_CR3","unstructured":"Dirk Ahlers (2013) Business entity retrieval and data provision for yellow pages by local search. In IRPS Workshop (ECIR2013)"},{"key":"9983_CR4","unstructured":"Ahlers D, Boll S (2009), On the accuracy of online geocoders. Geoinformatik"},{"key":"9983_CR5","doi-asserted-by":"publisher","unstructured":"Ahlers D, Boll S (2008), Retrieving address-based locations from the Web. In Proceeding of the 2nd international workshop on geographic information retrieval - GIR \u201908, 27. https:\/\/doi.org\/10.1145\/1460007.1460015","DOI":"10.1145\/1460007.1460015"},{"key":"9983_CR6","doi-asserted-by":"publisher","unstructured":"Ahlers D, Boll S (2008), Urban Web Crawling. First international workshop on location and the web (LocWeb 2008), 25\u201332. https:\/\/doi.org\/10.1145\/1367798.1367803","DOI":"10.1145\/1367798.1367803"},{"key":"9983_CR7","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-84628-827-2_6","author":"D Ahlers","year":"2007","unstructured":"Ahlers D, Boll S (2007) Location-based web Search. The Geospatial Web. https:\/\/doi.org\/10.1007\/978-1-84628-827-2_6","journal-title":"The Geospatial Web"},{"key":"9983_CR8","first-page":"32","volume-title":"Human language technology conference and conference on empirical methods in natural language processing, 6\u20138 October 2005","author":"Popescu AM, Nguyen B, Etzioni O (2005) OPINE: Extracting Product Features and Opinions from Reviews. Proc. of the HLT\/EMNLP","year":"2005","unstructured":"Popescu AM, Nguyen B, Etzioni O (2005) OPINE: Extracting Product Features and Opinions from Reviews. Proc. of the HLT\/EMNLP (2005) Human language technology conference and conference on empirical methods in natural language processing, 6\u20138 October 2005. Vancouver, British Columbia, Canada, pp 32\u201333"},{"key":"9983_CR9","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-78849-2_41","author":"S Asadi","year":"2008","unstructured":"Asadi S, Yang G, Zhou X, Shi Y, Zhai B, Jiang WWR (2008) Pattern-based extraction of addresses from Web page content. Lecture notes in computer science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics). https:\/\/doi.org\/10.1007\/978-3-540-78849-2_41","journal-title":"Lecture notes in computer science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)"},{"key":"9983_CR10","doi-asserted-by":"publisher","unstructured":"Babych B, Hartley A, (2003) Improving machine translation quality with automatic named entity recognition. In proceedings of the 7th international EAMT workshop on MT and other language technology tools, improving MT through other language technology tools resources and tools for building MT - EAMT \u201903 (pp. 1\u20138), Morristown, NJ, USA: Association for Computational Linguistics. https:\/\/doi.org\/10.3115\/1609822.1609823","DOI":"10.3115\/1609822.1609823"},{"key":"9983_CR11","doi-asserted-by":"publisher","unstructured":"Bakshi R, Knoblock CA, Thakkar S (2005) Exploiting online sources to accurately geocode addresses. Proceedings of the 12th annual ACM international workshop on geographic information systems, 194, https:\/\/doi.org\/10.1145\/1032222.1032251","DOI":"10.1145\/1032222.1032251"},{"issue":"17","key":"9983_CR12","doi-asserted-by":"publisher","first-page":"6976","DOI":"10.1016\/j.eswa.2013.06.047","volume":"40","author":"E Baralis","year":"2013","unstructured":"Baralis E, Cagliero L, Jabeen S, Fiori A, Shah S (2013) Multi-document summarization based on the Yago ontology. Expert Syst Appl 40(17):6976\u20136984. https:\/\/doi.org\/10.1016\/j.eswa.2013.06.047","journal-title":"Expert Syst Appl"},{"key":"9983_CR13","doi-asserted-by":"crossref","unstructured":"Bellini P, Benigni M, Billero R, Nesi P, Rauch N (2014) Ontology construction and knowledge base feeding and cleaning for smart-city services. IEEE 19 Int. Conf. on Engineering of complex computer systems (ICECCS 2014)","DOI":"10.1109\/ICECCS.2014.33"},{"issue":"5","key":"9983_CR14","doi-asserted-by":"publisher","first-page":"926","DOI":"10.1109\/TASL.2009.2019927","volume":"17","author":"Y Benajiba","year":"2009","unstructured":"Benajiba Y, Rosso P, Diab M (2009) Arabic named entity recognition: a feature-driven study. IEEE Trans Audio Speech Language Process 17(5):926\u2013934. https:\/\/doi.org\/10.1109\/TASL.2009.2019927","journal-title":"IEEE Trans Audio Speech Language Process"},{"issue":"13","key":"9983_CR15","first-page":"1830","volume":"21","author":"J Betina Antony","year":"2015","unstructured":"Betina Antony J, Mahalakshmi GS (2015) Content-based information retrieval by named entity recognition and verb semantic role labelling. J Univ Comput Sci 21(13):1830\u20131848","journal-title":"J Univ Comput Sci"},{"key":"9983_CR16","doi-asserted-by":"publisher","DOI":"10.3115\/974557.974586","author":"DM Bikel","year":"1997","unstructured":"Bikel DM, Miller S, Schwartz R, Weischedel R (1997) Nymble: a high-performance learning name-finder. Proceedings of the fifth conference on applied natural language processing. https:\/\/doi.org\/10.3115\/974557.974586","journal-title":"Proceedings of the fifth conference on applied natural language processing"},{"issue":"3","key":"9983_CR17","doi-asserted-by":"publisher","first-page":"221","DOI":"10.1023\/A:1011482030093","volume":"5","author":"KAV Borges","year":"2001","unstructured":"Borges KAV, Davis CA, Laender AHF (2001) OMT-G: an object-oriented data model for geographic applications. GeoInformatica 5(3):221\u2013260. https:\/\/doi.org\/10.1023\/A:1011482030093","journal-title":"GeoInformatica"},{"key":"9983_CR18","doi-asserted-by":"publisher","unstructured":"Borges KAVV, Laender AHFF, Medeiros CBand Davis Jr., Ca (2007), Discovering geographic locations in Web pages using urban addresses. GIR \u201907 proceedings of the 4th ACM workshop on geographical information retrieval, 31\u201336. https:\/\/doi.org\/10.1145\/1316948.1316957","DOI":"10.1145\/1316948.1316957"},{"issue":"4","key":"9983_CR19","doi-asserted-by":"publisher","first-page":"609","DOI":"10.1007\/s10707-010-0118-z","volume":"15","author":"KAV Borges","year":"2011","unstructured":"Borges KAV, Davis CA, Laender AHFand Medeiros CB, (2011) Ontology-driven discovery of geospatial evidence in web pages. GeoInformatica 15(4):609\u2013631. https:\/\/doi.org\/10.1007\/s10707-010-0118-z","journal-title":"GeoInformatica"},{"issue":"2","key":"9983_CR20","doi-asserted-by":"publisher","first-page":"175","DOI":"10.1145\/376284.375682","volume":"30","author":"V Borkar","year":"2001","unstructured":"Borkar V, Deshmukh K, Sarawagi S (2001) Automatic segmentation of text into structured records. ACM SIGMOD Record 30(2):175\u2013186. https:\/\/doi.org\/10.1145\/376284.375682","journal-title":"ACM SIGMOD Record"},{"key":"9983_CR21","unstructured":"Borthwick A, Sterling J, Agichtein E, Grishman R (1998) Exploiting diverse knowledge sources via maximum entropy in named entity recognition. Proceedings of the 6th workshop on very large Corpora, 152\u2013160. http:\/\/acl.ldc.upenn.edu\/W\/W98\/W98-1118.pdf"},{"key":"9983_CR22","unstructured":"Cai D, Yu S, Wen JR, Ma WY (2003) Vips: a vision-based page segmentation algorithm. Technical Report, MSR-TR-2003-79. https:\/\/www.microsoft.com\/en-us\/research\/wp-content\/uploads\/2016\/02\/tr-2003-79.pdf"},{"key":"9983_CR23","doi-asserted-by":"publisher","unstructured":"Cai D, He X, Wen JR, Ma WY (2004, July). Block-level link analysis. In Proceedings of the 27th annual international ACM SIGIR conference on research and development in information retrieval (pp. 440-447). https:\/\/doi.org\/10.1145\/1008992.1009068","DOI":"10.1145\/1008992.1009068"},{"key":"9983_CR24","doi-asserted-by":"publisher","unstructured":"Cai D, Yu S, Wen J-R, Ma W-Y (2004) Block-based Web search. Proceedings of the 27th annual international ACM SIGIR conference on research and development in information retrieval, 456\u2013463. https:\/\/doi.org\/10.1145\/1008992.1009070","DOI":"10.1145\/1008992.1009070"},{"key":"9983_CR25","first-page":"925","volume":"3399","author":"WT Cai","year":"2005","unstructured":"Cai WT, Wang SR, Jiang QS (2005) Address extraction: extraction of location-based information from the web. Web Technol Res Dev - Apweb 3399:925\u2013937","journal-title":"Web Technol Res Dev - Apweb"},{"key":"9983_CR26","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLC.2004.1382024","author":"W Cai","year":"2004","unstructured":"Cai W, Wang S, Jiang Q (2004) Address extraction: a graph matching and ontology-based approach to conceptual information retrieval. Proceedings of international conference on machine learning and cybernetics. https:\/\/doi.org\/10.1109\/ICMLC.2004.1382024","journal-title":"Proceedings of international conference on machine learning and cybernetics"},{"key":"9983_CR27","unstructured":"Can L, Qian Z, Xiaofeng M, Wenyin L (2005) Postal address detection from web documents. International workshop on challenges in web information retrieval and integration, 40\u201345. http:\/\/dl.acm.org\/citation.cfm?id=1105926.1106228"},{"key":"9983_CR28","first-page":"51","volume-title":"Australasian language technology workshop 2006, November 30-December 1, 2006","author":"Cavedon IL, Zukerman I, Moll D, Zaanen M Van, Smith D, (2006) Named entity recognition for question answering. Proc. of the","year":"2006","unstructured":"Cavedon IL, Zukerman I, Moll D, Zaanen M Van, Smith D, (2006) Named entity recognition for question answering. Proc. of the (2006) Australasian language technology workshop 2006, November 30-December 1, 2006. Sancta Sophia College. Sydney. Australasian Language Technology Association, Carlton, Vic, pp 51\u201358"},{"issue":"2","key":"9983_CR29","doi-asserted-by":"publisher","first-page":"93","DOI":"10.1080\/17445760802429585","volume":"25","author":"J Cao","year":"2010","unstructured":"Cao J, Mao B, Luo J (2010) A segmentation method for web page analysis using shrinking and dividing. Int J Parallel Emerg Distributed Syst 25(2):93\u2013104. https:\/\/doi.org\/10.1080\/17445760802429585","journal-title":"Int J Parallel Emerg Distributed Syst"},{"key":"9983_CR30","doi-asserted-by":"publisher","unstructured":"Chakrabarti D, Kumar R, Punera K (2008, April) A graph-theoretic approach to webpage segmentation. In Proceedings of the 17th international conference on World Wide Web (pp. 377-386). https:\/\/doi.org\/10.1145\/1367497.1367549","DOI":"10.1145\/1367497.1367549"},{"key":"9983_CR31","doi-asserted-by":"publisher","unstructured":"Chang CH, Li SY (2010), MapMarker: Extraction of postal addresses and associated information for general Web pages. Proceedings - 2010 IEEE\/WIC\/ACM international conference on web intelligence, WI 2010, 1, 105\u2013111. https:\/\/doi.org\/10.1109\/WI-IAT.2010.64","DOI":"10.1109\/WI-IAT.2010.64"},{"key":"9983_CR32","unstructured":"Chang C-H, Huang C-Y, Su Y-S (2012) On Chinese postal address and associated information extraction. The 26th annual conference of the Japanese society for artificial intelligence"},{"key":"9983_CR33","doi-asserted-by":"publisher","unstructured":"Chieu HL, Ng HT (2002) Named entity recognition: a maximum entropy approach using global information. Coling \u201902, 1, 1\u20137. https:\/\/doi.org\/10.3115\/1072228.1072253","DOI":"10.3115\/1072228.1072253"},{"key":"9983_CR34","unstructured":"Chinchor N, Robinson P (1997, September). MUC-7 named entity task definition. In proceedings of the 7th conference on message understanding (Vol. 29, pp. 1-21)"},{"issue":"2003","key":"9983_CR35","doi-asserted-by":"publisher","first-page":"357","DOI":"10.3115\/1119176.1119204","volume":"4","author":"JPC Chiu","year":"2016","unstructured":"Chiu JPC, Nichols E (2016) Named entity recognition with bidirectional LSTM-CNNs, transactions of the association for. Comput Linguist 4(2003):357\u2013370. https:\/\/doi.org\/10.3115\/1119176.1119204","journal-title":"Comput Linguist"},{"key":"9983_CR36","unstructured":"Choi FY, Wiemer-Hastings P, Moore JD (2001) Latent semantic analysis for text segmentation. In Proceedings of the 2001 conference on empirical methods in natural language processing"},{"key":"9983_CR37","doi-asserted-by":"publisher","unstructured":"Chu WW (2013) Erratum: data mining and knowledge discovery for big data. Data mining and knowledge discovery for big data pp 305-308. https:\/\/doi.org\/10.1007\/978-3-642-40837-3_10","DOI":"10.1007\/978-3-642-40837-3_10"},{"key":"9983_CR38","doi-asserted-by":"crossref","unstructured":"Chang C-H, Kayed M, Girgis MR, Shaalan KF (2006) A survey of web information extraction systems, IEEE transactions on knowledge and data engineering, 18(10): pp. 1411\u20131428. https:\/\/ieeexplore.ieee.org\/document\/1683775","DOI":"10.1109\/TKDE.2006.152"},{"issue":"3","key":"9983_CR39","doi-asserted-by":"publisher","first-page":"539","DOI":"10.1007\/s10489-015-0707-5","volume":"44","author":"C-H Chang","year":"2016","unstructured":"Chang C-H, Chuang HM, Huang CY, Su YS, Li SY (2016) Enhancing POI search on maps via online address extraction and associated information segmentation. Appl Intell 44(3):539\u2013556. https:\/\/doi.org\/10.1007\/s10489-015-0707-5","journal-title":"Appl Intell"},{"key":"9983_CR40","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10491-1_2","author":"H-M Chuang","year":"2014","unstructured":"Chuang H-M, Chang C-H, Kao T-Y (2014) Effective web crawling for chinese addresses and associated information. Int Conf Electron Commerce Web Technol. https:\/\/doi.org\/10.1007\/978-3-319-10491-1_2","journal-title":"Int Conf Electron Commerce Web Technol"},{"issue":"7","key":"9983_CR41","doi-asserted-by":"publisher","first-page":"1405","DOI":"10.1080\/13658816.2015.1133820","volume":"30","author":"H Chuang","year":"2016","unstructured":"Chuang H, Chang C, Kao T, Cheng C, Cheong K (2016) Enabling maps\/location searches on mobile devices- constructing a POI database via focused crawling and information extraction. Int J Geogr Inform Sci 30(7):1405\u20131425. https:\/\/doi.org\/10.1080\/13658816.2015.1133820","journal-title":"Int J Geogr Inform Sci"},{"key":"9983_CR42","unstructured":"Cunningham H, Maynard D, Bontcheva K, ACL VT (2002) GATE: A framework and graphical development environment for robust NLP tools and applications. Proceedings of the 40th annual meeting of the association for computational linguistics, July 6-12, 2002, Philadelphia, PA, USA. http:\/\/www.aclweb.org\/anthology\/P\/P02\/P02-1022.pdf"},{"issue":"1","key":"9983_CR43","doi-asserted-by":"publisher","first-page":"103","DOI":"10.1007\/s10707-006-0015-7","volume":"11","author":"CA Davis","year":"2007","unstructured":"Davis CA, Fonseca FT (2007) Assessing the certainty of locations produced by an address geocoding system. GeoInformatica 11(1):103\u2013129. https:\/\/doi.org\/10.1007\/s10707-006-0015-7","journal-title":"GeoInformatica"},{"issue":"4","key":"9983_CR44","doi-asserted-by":"publisher","first-page":"387","DOI":"10.1111\/j.1467-9671.2010.01212.x","volume":"14","author":"R Devillers","year":"2010","unstructured":"Devillers R, Stein A, B\u00e9dard Y, Chrisman N, Fisher P, Shi W (2010) Thirty years of research on satial data quality achievements, failures, and opportunities. Trans GIS 14(4):387\u2013400. https:\/\/doi.org\/10.1111\/j.1467-9671.2010.01212.x","journal-title":"Trans GIS"},{"issue":"8","key":"9983_CR45","doi-asserted-by":"publisher","first-page":"1631","DOI":"10.1080\/13658816.2018.1447671","volume":"32","author":"R Ding","year":"2018","unstructured":"Ding R, Chen Z (2018) RecNet: a deep neural network for personalized POI recommendation in location-based social networks. Int J Geogr Inform Sci 32(8):1631\u201348","journal-title":"Int J Geogr Inform Sci"},{"key":"9983_CR46","doi-asserted-by":"crossref","unstructured":"Du L, Pate JK, Johnson M (2015, February). Topic segmentation with an ordering-based topic model. In 29th AAAI conference on artificial intelligence","DOI":"10.1609\/aaai.v29i1.9502"},{"key":"9983_CR47","doi-asserted-by":"crossref","unstructured":"Efremova J, Endres I, Vidas I, Melnik O (2018, July) A geo-tagging framework for address extraction from Web pages. In industrial conference on data mining (pp. 288-295)","DOI":"10.1007\/978-3-319-95786-9_22"},{"issue":"3","key":"9983_CR48","first-page":"155","volume":"4","author":"A Ekbal","year":"2010","unstructured":"Ekbal A, Bandyopadhyay S (2010) Named entity recognition using support vector machine a language independent approach. Int J Electr Comput Eng 4(3):155\u2013170","journal-title":"Int J Electr Comput Eng"},{"issue":"1","key":"9983_CR49","doi-asserted-by":"publisher","first-page":"91","DOI":"10.1016\/j.artint.2005.03.001","volume":"165","author":"O Etzioni","year":"2005","unstructured":"Etzioni O, Cafarella M, Downey D, Popescu AM, Shaked T, Soderland S, Yates A (2005) Unsupervised named-entity extraction from the Web: an experimental study. Artif Intell 165(1):91\u2013134. https:\/\/doi.org\/10.1016\/j.artint.2005.03.001","journal-title":"Artif Intell"},{"key":"9983_CR50","unstructured":"Faloutsos C, Oard DW (1998) A survey of information retrieval and filtering methods. A J Comp Educ, 1\u201324. http:\/\/drum.lib.umd.edu\/handle\/1903\/436"},{"key":"9983_CR51","unstructured":"Fan Y, Pang L, Hou J, Guo J, Lan Y, Cheng X. Matchzoo: A toolkit for deep text matching. arXiv preprint arXiv:1707.07270. 2017 Jul 23"},{"key":"9983_CR52","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1109\/ICNLSP.2018.8374393","volume":"2018","author":"AA Freihat","year":"2018","unstructured":"Freihat AA, Bella G, Mubarak H, Giunchiglia F (2018) A single-model approach for Arabic segmentation, POS tagging, and named entity recognition. The 2nd International conference on natural language and speech processing. ICNLSP 2018:1\u20138. https:\/\/doi.org\/10.1109\/ICNLSP.2018.8374393","journal-title":"ICNLSP"},{"key":"9983_CR53","doi-asserted-by":"publisher","unstructured":"Freitag D, McCallum AK (1999) Information extraction using HMMs and shrinkage. AAAI99 workshop on machine learning for information extraction, 31\u201336. https:\/\/doi.org\/10.1017\/CBO9781107415324.004","DOI":"10.1017\/CBO9781107415324.004"},{"key":"9983_CR54","doi-asserted-by":"publisher","DOI":"10.1016\/j.compenvurbsys.2014.02.004","author":"S Gao","year":"2014","unstructured":"Gao S, Li L, Li W, Janowicz K, Zhang Y (2014) Computers, environment and urban systems Cconstructing gazetteers from volunteered Big geo-data based on Hadoop. Comput Environ Urban Syst. https:\/\/doi.org\/10.1016\/j.compenvurbsys.2014.02.004","journal-title":"Comput Environ Urban Syst"},{"key":"9983_CR55","doi-asserted-by":"crossref","unstructured":"Goodchild MF (1992). Geographical data modeling. Computers Geosciences, 401\u2013408. https:\/\/www.sciencedirect.com\/science\/article\/pii\/0098300492900694","DOI":"10.1016\/0098-3004(92)90069-4"},{"issue":"4","key":"9983_CR56","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s10708-007-9111-y","volume":"69","author":"MF Goodchild","year":"2007","unstructured":"Goodchild MF (2007) Citizens as sensors: the world of volunteered geography. GeoJournal 69(4):211\u2013221. https:\/\/doi.org\/10.1007\/s10708-007-9111-y","journal-title":"GeoJournal"},{"key":"9983_CR57","doi-asserted-by":"publisher","unstructured":"Guo J, Xu G, Cheng X, Li H (2009) Named Entity Recognition in Query. Proceedings of the 32nd International ACM SIGIR conference on research and development in information retrieval - SIGIR \u201909, 267. https:\/\/doi.org\/10.1145\/1571941.1571989","DOI":"10.1145\/1571941.1571989"},{"key":"9983_CR58","doi-asserted-by":"crossref","unstructured":"Gupta S, Kaiser G, Neistadt D, Grimm P (2003, May) DOM-based content extraction of HTML documents. In proceedings of the 12th international conference on World Wide Web (pp. 207-214)","DOI":"10.1145\/775152.775182"},{"key":"9983_CR59","unstructured":"Guptill SC, Morrison JL (2013) Elements of spatial data quality"},{"issue":"4","key":"9983_CR60","doi-asserted-by":"publisher","first-page":"682","DOI":"10.1068\/b35097","volume":"37","author":"M Haklay","year":"2010","unstructured":"Haklay M (2010) How good is volunteered geographical information? A comparative study of OpenStreetMap and ordnance survey datasets. Environ Plan B: Plan Des 37(4):682\u2013703. https:\/\/doi.org\/10.1068\/b35097","journal-title":"Environ Plan B: Plan Des"},{"key":"9983_CR61","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-38634-3_8","author":"AL Han","year":"2013","unstructured":"Han AL, Wong DF, Chao LS (2013) Chinese named entity recognition with conditional random fields in the light of Chinese characteristics. Lang Process Intell Inform Syst. https:\/\/doi.org\/10.1007\/978-3-642-38634-3_8","journal-title":"Lang Process Intell Inform Syst"},{"key":"9983_CR62","doi-asserted-by":"crossref","unstructured":"Hattori G, Hoashi K, Matsumoto K, Sugaya F (2007, May) Robust web page segmentation for mobile terminal using content-distances and page layout information. In Proceedings of the 16th international conference on World Wide Web (pp. 361-370)","DOI":"10.1145\/1242572.1242622"},{"issue":"10","key":"9983_CR63","doi-asserted-by":"publisher","first-page":"2076","DOI":"10.1080\/13658816.2018.1480783","volume":"32","author":"J He","year":"2018","unstructured":"He J, Li X, Yao Y, Hong Y, Jinbao Z (2018) Mining transition rules of cellular automata for simulating urban expansion by using the deep learning techniques. Int J Geogr Inform Sci 32(10):2076\u201397","journal-title":"Int J Geogr Inform Sci"},{"key":"9983_CR64","unstructured":"Helbich M, Amelunxen C, Neis P, Zipf A, (2012) Comparative spatial analysis of positional accuracy of openStreetMap and proprietary geodata. Proceedings of GI\\_Forum, 24\u201333 http:\/\/gispoint.de\/fileadmin\/user_upload\/paper_gis_open\/537521013.pdf"},{"key":"9983_CR65","unstructured":"Hill LL (2009) Georeferencing: The geographic associations of information. Mit Press"},{"key":"9983_CR66","doi-asserted-by":"publisher","unstructured":"Hill LL, (2000) Core Elements of Digital Gazetteers: Placenames, Categories, and Footprints. The 4th European Conference, ECDL, (2000) Lisbon. Portugal. https:\/\/doi.org\/10.1007\/3-540-45268-0_26","DOI":"10.1007\/3-540-45268-0_26"},{"key":"9983_CR67","unstructured":"Huang Z, Xu W, Yu K (2015) Bidirectional LSTM-CRF Models for Sequence Tagging. ArXiv 2015. http:\/\/arxiv.org\/abs\/1508.01991"},{"key":"9983_CR68","doi-asserted-by":"publisher","unstructured":"Hui N, Hua Y, Ya-zhou T, Hao W (2009) A method of Chinese named entity recognition based on maximum entropy model. Mechatronics and automation, 2009. IEEE conference on mechatronics and automation, 2472\u20132477, https:\/\/doi.org\/10.1109\/ICMA.2009.5246408","DOI":"10.1109\/ICMA.2009.5246408"},{"issue":"3","key":"9983_CR69","doi-asserted-by":"publisher","first-page":"219","DOI":"10.1080\/13658810701626343","volume":"22","author":"CB Jones","year":"2008","unstructured":"Jones CB, Purves RS (2008) Geographical information retrieval. Int J Geogr Inform Sci 22(3):219\u2013228. https:\/\/doi.org\/10.1080\/13658810701626343","journal-title":"Int J Geogr Inform Sci"},{"key":"9983_CR70","doi-asserted-by":"crossref","unstructured":"Kayed M, Chang C-H (2010) FiVaTech: Page-Level web data extraction from template pages, IEEE Transaction on knowledge and data Eng., vol. 22, no. 2, pp. 249-263, https:\/\/ieeexplore.ieee.org\/document\/4476640\/","DOI":"10.1109\/TKDE.2009.82"},{"key":"9983_CR71","doi-asserted-by":"crossref","unstructured":"Kohlsch\u00fctter C, Nejdl W (2008, October). A densitometric approach to web page segmentation. In Proceedings of the 17th ACM conference on Information and knowledge management, 1173-1182","DOI":"10.1145\/1458082.1458237"},{"key":"9983_CR72","doi-asserted-by":"crossref","unstructured":"Kokla M, Papadias V, Tomai E. Enrichment and population of a geospatial ontology for semantic information extraction. International archives of the photogrammetry, remote sensing and spatial information sciences. 2018 Sep 19;42(4)","DOI":"10.5194\/isprs-archives-XLII-4-309-2018"},{"key":"9983_CR73","unstructured":"Kovacevic M, Diligenti M, Gori M, Milutinovic V (2002, December). Recognition of common areas in a web page using visual information: a possible application in a page classification. In 2002 IEEE international conference on data mining, 2002. Proceedings. (pp. 250-257). IEEE"},{"key":"9983_CR74","doi-asserted-by":"crossref","unstructured":"Kuhn W (2005) Geospatial semantics: why, of what, and how?. InJournal on data semantics III 2005 (pp. 1-24). Springer, Berlin, Heidelberg","DOI":"10.1007\/11496168_1"},{"key":"9983_CR75","doi-asserted-by":"crossref","unstructured":"Lample G, Ballesteros M, Subramanian S, Kawakami K, Dyer C (2016) Neural Architectures for Named Entity Recognition. Proceedings of the 2016 conference of the North American chapter of the association for computational linguistics: human language technologies arxiv: abs\/1603.01360","DOI":"10.18653\/v1\/N16-1030"},{"key":"9983_CR76","doi-asserted-by":"publisher","unstructured":"Larson RR, Frontiera P Geographic (1996) Information Retrieval and Spatial Browsing. 32nd Clinic on library applications of data processing, (January 1995), 81\u2013124 https:\/\/doi.org\/10.1145\/1008992.1009143","DOI":"10.1145\/1008992.1009143"},{"issue":"2","key":"9983_CR77","first-page":"22","volume":"20","author":"JL Leidner","year":"2004","unstructured":"Leidner JL (2004) Towards a reference corpus for automatic toponym resolution evaluation. Workshop on geographic information retrieval, Sheffield, Inderjeet Mani, Janet Hitzeman, Justin Richer, Dave Harris, Rob Quimby, and Ben Wellner 20(2):22\u201323","journal-title":"Workshop on geographic information retrieval, Sheffield, Inderjeet Mani, Janet Hitzeman, Justin Richer, Dave Harris, Rob Quimby, and Ben Wellner"},{"key":"9983_CR78","doi-asserted-by":"crossref","unstructured":"Li W, Hsu CY (2020) Automated terrain feature identification from remote sensing imagery: a deep learning approach. International Journal of Geographical Information Science (2;34(4):637\u201360)","DOI":"10.1080\/13658816.2018.1542697"},{"issue":"3","key":"9983_CR79","doi-asserted-by":"publisher","first-page":"559","DOI":"10.1080\/13658816.2019.1681431","volume":"34","author":"Y Lin","year":"2020","unstructured":"Lin Y, Kang M, Wu Y, Du Q, Liu T (2020) A deep learning architecture for semantic address matching. Int J Geogr Inform Sci 34(3):559\u201376","journal-title":"Int J Geogr Inform Sci"},{"key":"9983_CR80","doi-asserted-by":"crossref","unstructured":"Liu Y, Liu W, Jiang C (2004, July) User interest detection on web pages for building personalized information agent. In International conference on web-age information management (pp. 280-290). Springer, Berlin, Heidelberg","DOI":"10.1007\/978-3-540-27772-9_29"},{"key":"9983_CR81","doi-asserted-by":"publisher","unstructured":"Liu X (2016) Extracting Addresses From News Reports Using Conditional Random Fields. 15th IEEE International conference on machine learning and applications (ICMLA) https:\/\/doi.org\/10.1109\/ICMLA.2016.94","DOI":"10.1109\/ICMLA.2016.94"},{"key":"9983_CR82","doi-asserted-by":"crossref","unstructured":"Ma X, Hovy E, (2016) End-to-end Sequence Labeling via Bi-directional LSTM-CNNs-CRF. Proceedings of the 54th annual meeting of the association for computational linguistics arxiv: abs\/1603.01354","DOI":"10.18653\/v1\/P16-1101"},{"key":"9983_CR83","unstructured":"Machado IMR, Alencar RO De, Oliveira R De, Junior C, Junior CAD (2010) An Ontological Gazetteer for geographic information retrieval. Proceedingd XI GEOINFO, Campos Do Jordao, Brazil, (Hill 2000), 21\u201332"},{"key":"9983_CR84","doi-asserted-by":"publisher","unstructured":"Mandl T, Womser-Hacker C (2005) The effect of named entities on effectiveness in cross-language information retrieval evaluation. Proceedings of the 2005 ACM symposium on Applied computing https:\/\/doi.org\/10.1145\/1066677.1066919","DOI":"10.1145\/1066677.1066919"},{"key":"9983_CR85","unstructured":"McCallum A (2002) Efficiently inducing features of conditional random fields. Proceeding UAI\u201903 proceedings of the nineteenth conference on uncertainty in artificial intelligence, 19(July), 168\u2013175, . https:\/\/dl.acm.org\/citation.cfm?id=2100633"},{"issue":"4","key":"9983_CR86","doi-asserted-by":"publisher","first-page":"528","DOI":"10.1016\/j.ipm.2010.11.008","volume":"47","author":"H Misra","year":"2011","unstructured":"Misra H, Yvon F, Capp\u00e9 O, Jose J (2011) Text segmentation: a topic modeling perspective. Inform Process Manag 47(4):528\u2013544","journal-title":"Inform Process Manag"},{"key":"9983_CR87","doi-asserted-by":"publisher","unstructured":"Morimoto Y, Houle ME, Mccurley KS, Road H, Jose S, Extracting spatial knowledge from the web. In 2003 symposium on applications and the Internet, pp. 326-333 (2003). https:\/\/doi.org\/10.1109\/SAINT.2003.1183066","DOI":"10.1109\/SAINT.2003.1183066"},{"issue":"1","key":"9983_CR88","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1075\/li.30.1.03nad","volume":"30","author":"D Nadeau","year":"2007","unstructured":"Nadeau D, Sekine S (2007) A survey of named entity recognition and classification. Lingvisticae Investigationes 30(1):3\u201326. https:\/\/doi.org\/10.1075\/li.30.1.03nad","journal-title":"Lingvisticae Investigationes"},{"key":"9983_CR89","doi-asserted-by":"publisher","DOI":"10.1007\/11881599","author":"P Nagabhushan","year":"2006","unstructured":"Nagabhushan P, Angadi S, Anami B (2006) A fuzzy symbolic inference system for postal address component extraction and labelling. Fuzzy Syst Knowl Discov. https:\/\/doi.org\/10.1007\/11881599","journal-title":"Fuzzy Syst Knowl Discov"},{"key":"9983_CR90","doi-asserted-by":"publisher","unstructured":"Nesi P, Pantaleo G, Tenti M (2014) Ge(o)Lo(cator): Geographic Information Extraction from Unstructured Text Data and Web Documents. 9th International Workshop on Semantic and Social Media Adaptation and Personalization https:\/\/doi.org\/10.1109\/SMAP.2014.27","DOI":"10.1109\/SMAP.2014.27"},{"key":"9983_CR91","unstructured":"Nicol GT (1993) Flex: the lexical scanner generator. Free Software Foundation"},{"key":"9983_CR92","unstructured":"Nobata C, Sekine S, Isahara H, Grishman R (2002) Summarization system integrated with named entity tdagging and IE pattern Discovery. Proceedings of the Third International conference on language resources and evaluation (LREC\u201902, 1, 1\u20134) http:\/\/pdfs.semanticscholar.org\/c500\/40ac812c3f3le0cf37802ff87de2dce87821.pdf"},{"key":"9983_CR93","unstructured":"Resnik P (1995) Using Information Content to Evaluate Semantic Similarity in a Taxonomy. Proceedings of the 14th international joint conference on Artificial intelligence vol. 1 http:\/\/arxiv.org\/abs\/cmp-lg\/9511007"},{"issue":"15","key":"9983_CR94","doi-asserted-by":"publisher","first-page":"5811","DOI":"10.1016\/j.eswa.2013.05.008","volume":"40","author":"\u00c1 Rodrigo","year":"2013","unstructured":"Rodrigo \u00c1, P\u00e9rez-Iglesias J, Pe\u00f1as A, Garrido G, Araujo L (2013) Answering questions about European legislation. Expert Syst Appl 40(15):5811\u20135816. https:\/\/doi.org\/10.1016\/j.eswa.2013.05.008","journal-title":"Expert Syst Appl"},{"key":"9983_CR95","doi-asserted-by":"publisher","unstructured":"Saad MB, Gan\u00e7arski S (2010, March) Using visual pages analysis for optimizing web archiving. In Proceedings of the 2010 EDBT\/ICDT Workshops (pp. 1-7). https:\/\/doi.org\/10.1145\/1754239.1754287","DOI":"10.1145\/1754239.1754287"},{"key":"9983_CR96","unstructured":"Sagara T, Kitsuregawa M (2001) Yellow Page driven Methods of Collecting and Scoring Spatial Web Documents. SIGIR Workshop on Geographical Information Retrieval (2004). http:\/\/www.geo.unizh.ch\/~rsp\/gir\/"},{"key":"9983_CR97","doi-asserted-by":"publisher","unstructured":"Schmidt S, Manschitz S, Rensing C, Steinmetz R (2013) Extraction of Address Data from Unstructured Text using Free Knowledge Resources. 13th International Conference on Knowledge Management and Knowledge Technologies, At Graz, Austria https:\/\/doi.org\/10.1145\/2494188.2494193","DOI":"10.1145\/2494188.2494193"},{"key":"9983_CR98","unstructured":"Sekine S, Grishman R, Shinnou H (1998) A Decision Tree Method for finding and classifying names in Japanese texts. Proceeding of the 6th workshop on Very Large Corpora, (May), 171\u2013178"},{"key":"9983_CR99","doi-asserted-by":"publisher","first-page":"534","DOI":"10.1109\/ICINFA.2009.5204981","volume":"2009","author":"HJ Song","year":"2009","unstructured":"Song HJ, Park SB, Park SY (2009) An automatic ontology population with a machine learning technique from semi-structured documents. IEEE Int Conf Inform Auto ICIA 2009:534\u2013539. https:\/\/doi.org\/10.1109\/ICINFA.2009.5204981","journal-title":"IEEE Int Conf Inform Auto ICIA"},{"key":"9983_CR100","doi-asserted-by":"publisher","unstructured":"Song R, Liu H, Wen JR, Ma WY (2004, May) Learning block importance models for web pages. In Proceedings of the 13th international conference on World Wide Web (pp. 203-211). https:\/\/doi.org\/10.1145\/988672.988700","DOI":"10.1145\/988672.988700"},{"key":"9983_CR101","doi-asserted-by":"publisher","unstructured":"Souza LA, Davis CA, Borges KAV, Delboni TM (2005) Laender AHF (2005) The role of gazetteers in geographic knowledge discovery on the Web. Proceedings - Third Latin American Web Congress, LA-WEB 2005:157\u2013165. https:\/\/doi.org\/10.1109\/LAWEB.2005.38","DOI":"10.1109\/LAWEB.2005.38"},{"issue":"April","key":"9983_CR102","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1162\/COLI","volume":"38","author":"IG Stab Christian","year":"2017","unstructured":"Stab Christian IG (2017) Parsing argumentation structures in persuasive essays christian. Jurnal Pengurusan 38(April):41\u201351. https:\/\/doi.org\/10.1162\/COLI","journal-title":"Jurnal Pengurusan"},{"key":"9983_CR103","doi-asserted-by":"crossref","unstructured":"Takeuchi K, Collier N (2002) Use of support vector machines in extended named entity recognition. Proceedings of the 6th Conference on Natural Language Learning-Volume 20. Association for Computational Linguistics, 2002., 1\u20137 http:\/\/dl.acm.org\/citation.cfm?id=1118882","DOI":"10.3115\/1118853.1118882"},{"key":"9983_CR104","doi-asserted-by":"crossref","unstructured":"Teitler BE, Lieberman MD, Panozzo D, Sankaranarayanan J, Samet H, Sperling J (2008, November). NewsStand: A new view on news. In Proceedings of the 16th ACM SIGSPATIAL international conference on Advances in geographic information systems (pp. 1-10)","DOI":"10.1145\/1463434.1463458"},{"key":"9983_CR105","doi-asserted-by":"crossref","unstructured":"Tjong EF, Sang K, Meulder F De., Introduction to the CoNLL Shared Task Language Independent Named Entity Recognition. Proceedings of the Seventh Conference on Natural Language Learning at HLT-NAACL (2003)","DOI":"10.3115\/1119176.1119195"},{"issue":"4","key":"9983_CR106","doi-asserted-by":"publisher","first-page":"435","DOI":"10.1111\/j.1467-9671.2010.01203.x","volume":"14","author":"G Touya","year":"2010","unstructured":"Touya G (2010) Quality assessment of the French. Trans GIS 14(4):435\u2013459. https:\/\/doi.org\/10.1111\/j.1467-9671.2010.01203.x","journal-title":"Trans GIS"},{"key":"9983_CR107","unstructured":"Uryupina O (2002) Extracting geographical knowledge from the internet 2002.pdf. Proc. of the ICDM-AM International Workshop on Active Mining - Maebashi, 113\u2013118"},{"key":"9983_CR108","doi-asserted-by":"publisher","unstructured":"Uryupina O (2003) Semi-supervised learning of geographical gazetteers from the internet. Proceedings of the HLTNAACL 2003 Workshop on Analysis of Geographic References, 1, 18\u201325 https:\/\/doi.org\/10.3115\/1119394.1119397","DOI":"10.3115\/1119394.1119397"},{"key":"9983_CR109","doi-asserted-by":"crossref","unstructured":"Vadrevu S, Gelgi F, Davulcu H (2005, November). Semantic partitioning of web pages. In International Conference on Web Information Systems Engineering (pp. 107-118). Springer, Berlin, Heidelberg","DOI":"10.1007\/11581062_9"},{"issue":"81","key":"9983_CR110","doi-asserted-by":"publisher","first-page":"101473","DOI":"10.1016\/j.compenvurbsys.2020.101473","volume":"1","author":"L Xu","year":"2020","unstructured":"Xu L, Du Z, Mao R, Zhang F, Liu R (2020) GSAM: A deep neural network model for extracting computational representations of Chinese addresses fused with geospatial feature. Comput Environ Urban Syst 1(81):101473","journal-title":"Comput Environ Urban Syst"},{"key":"9983_CR111","doi-asserted-by":"publisher","unstructured":"Yu S, Cai D, Wen J-R, Ma W-Y (2004) Improving pseudo-relevance feedback in Web information retrieval using Web page segmentation. Proceedings of the 12th international conference on World Wide Web, 11-18 https:\/\/doi.org\/10.1145\/775152.775155","DOI":"10.1145\/775152.775155"},{"key":"9983_CR112","unstructured":"Yu Z (March, 2007), High accuracy postal address extraction from web pages.In Masters Abstracts International (Vol. 45, No. 05)"},{"key":"9983_CR113","doi-asserted-by":"publisher","unstructured":"Zhang J, Dang Q, Lu Y, Sun S (2013) Suffix tree clustering with named entity recognition. Proceedings - 2013 International Conference on Cloud Computing and Big Data, CLOUDCOM-ASIA 2013, 549\u2013556, https:\/\/doi.org\/10.1109\/CLOUDCOM-ASIA.2013.102","DOI":"10.1109\/CLOUDCOM-ASIA.2013.102"},{"key":"9983_CR114","doi-asserted-by":"publisher","unstructured":"Zhang Y, Gao M, Zhang X, Yang P, Ma Q, Wang C, Hu X (2018) An Automatic Approach to Extracting Geographic Information from Internet. IEEE Access, 3536(c), 1\u20131, (2018). https:\/\/doi.org\/10.1109\/ACCESS.2018.2844470","DOI":"10.1109\/ACCESS.2018.2844470"},{"key":"9983_CR115","doi-asserted-by":"publisher","unstructured":"Zhao S, (2004) Named entity recognition in biomedical texts using an HMM model. Proceedings of the International Joint Workshop on Natural Language Processing in Biomedicine and Its Applications - JNLPBA \u201904, (Grefenstette 1994), 84, https:\/\/doi.org\/10.3115\/1567594.1567613","DOI":"10.3115\/1567594.1567613"},{"issue":"2017","key":"9983_CR116","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1016\/j.neucom.2016.12.075","volume":"257","author":"S Zheng","year":"2017","unstructured":"Zheng S, Hao Y, Lu D, Bao H, Xu J, Hao H, Xu B (2017) Joint entity and relation extraction based on a hybrid neural network. Neurocomputing 257(2017):59\u201366. https:\/\/doi.org\/10.1016\/j.neucom.2016.12.075","journal-title":"Neurocomputing"},{"key":"9983_CR117","doi-asserted-by":"publisher","unstructured":"Zhou G, Su J (2001) Named entity recognition using an HMM-based chunk tagger. Proceedings of the 40th Annual Meeting on Association for Computational Linguistics - ACL \u201902, (July), 473. https:\/\/doi.org\/10.3115\/1073083.1073163","DOI":"10.3115\/1073083.1073163"},{"key":"9983_CR118","doi-asserted-by":"publisher","unstructured":"Zielstra D, Zipf A (2010) A comparative study of proprietary geodata and volunteered geographic information for Germany. 13th AGILE International Conference on Geographic Information Science 2010 Guimar\u00e3es, Portugal, 1, 1\u201315, https:\/\/doi.org\/10.1119\/1.1736005","DOI":"10.1119\/1.1736005"}],"container-title":["Artificial Intelligence Review"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-021-09983-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10462-021-09983-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10462-021-09983-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,21]],"date-time":"2022-12-21T12:16:21Z","timestamp":1671624981000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10462-021-09983-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,3,14]]},"references-count":118,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2022,2]]}},"alternative-id":["9983"],"URL":"https:\/\/doi.org\/10.1007\/s10462-021-09983-1","relation":{},"ISSN":["0269-2821","1573-7462"],"issn-type":[{"type":"print","value":"0269-2821"},{"type":"electronic","value":"1573-7462"}],"subject":[],"published":{"date-parts":[[2021,3,14]]},"assertion":[{"value":"14 March 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}