{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T04:27:23Z","timestamp":1750307243244,"version":"3.41.0"},"reference-count":55,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2017,5,9]],"date-time":"2017-05-09T00:00:00Z","timestamp":1494288000000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Prog Artif Intell"],"published-print":{"date-parts":[[2017,12]]},"DOI":"10.1007\/s13748-017-0127-3","type":"journal-article","created":{"date-parts":[[2017,5,9]],"date-time":"2017-05-09T20:47:17Z","timestamp":1494362837000},"page":"325-346","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["Applying named entity recognition and co-reference resolution for segmenting English texts"],"prefix":"10.1007","volume":"6","author":[{"given":"Pavlina","family":"Fragkou","sequence":"first","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2017,5,9]]},"reference":[{"key":"127_CR1","doi-asserted-by":"crossref","first-page":"34","DOI":"10.1016\/j.csl.2016.10.003","volume":"43","author":"ZS Abdallah","year":"2017","unstructured":"Abdallah, Z.S., Carman, M., Haffari, G.: Multi-domain evaluation framework for named entity recognition tools. Comput. Speech Lang. 43, 34\u201355 (2017)","journal-title":"Comput. Speech Lang."},{"issue":"3","key":"127_CR2","first-page":"161","volume":"12","author":"DE Appelt","year":"1999","unstructured":"Appelt, D.E.: Introduction to information extraction. J. AI Commun. Arch. 12(3), 161\u2013172 (1999)","journal-title":"J. AI Commun. Arch."},{"key":"127_CR3","unstructured":"Appelt, D.E., Hobbs, J.R., Bear, J., Israel, D.J., Tyson, M.: Fastus: a finite-state processor for information extraction from real-world text. In: Proceeding of the IJCAI\u201993, pp. 1172\u20131178 (1993)"},{"key":"127_CR4","doi-asserted-by":"crossref","unstructured":"Atda\u011f, S., Labatut, V.: A Comparison of named entity recognition tools applied to biographical texts. In: Proceedings of the 2nd International Conference on Systems and Computer Science, Villeneuve d\u2019Ascq (FR), pp. 228\u2013233 (2013)","DOI":"10.1109\/IcConSCS.2013.6632052"},{"key":"127_CR5","first-page":"8","volume":"46","author":"A Alajmi","year":"2012","unstructured":"Alajmi, A., Saad, E.M., Darwish, R.R.: Towards an ARABIC stop-words list generation. Int. J. Comput. Appl. 46, 8 (2012)","journal-title":"Int. J. Comput. Appl."},{"key":"127_CR6","unstructured":"Barzilay, R., Lapata, M.: Automatic evaluation of text coherence: models and representations. In: Proceedings of the 19th International Joint Conference on Artificial Intelligence (IJCAI\u201905), pp. 1085\u20131090 (2005)"},{"key":"127_CR7","doi-asserted-by":"crossref","unstructured":"Barzilay, R., Lapata, M.: Modeling local coherence: an entity-based approach. In: Proceedings of the 43rd Annual Meeting on Association for Computational Linguistics, pp. 141\u2013148 (2005)","DOI":"10.3115\/1219840.1219858"},{"issue":"1","key":"127_CR8","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1162\/coli.2008.34.1.1","volume":"34","author":"R Barzilay","year":"2008","unstructured":"Barzilay, R., Lapata, M.: Modeling local coherence: an entity-based approach. Comput. Linguist. 34(1), 1\u201334 (2008)","journal-title":"Comput. Linguist."},{"key":"127_CR9","doi-asserted-by":"crossref","first-page":"177","DOI":"10.1023\/A:1007506220214","volume":"34","author":"D Beeferman","year":"1999","unstructured":"Beeferman, D., Berger, A., Lafferty, J.: Statistical models for text segmentation. Mach. Learn. 34, 177\u2013210 (1999)","journal-title":"Mach. Learn."},{"key":"127_CR10","doi-asserted-by":"crossref","unstructured":"Bengtson, E., Roth, D.: Understanding the value of features for co-reference resolution. In: Proceedings of EMNLP \u201908 Conference on Empirical Methods in Natural Language Processing, pp. 294\u2013303 (2008)","DOI":"10.3115\/1613715.1613756"},{"key":"127_CR11","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1162\/coli.2006.32.1.5","volume":"1","author":"Y Bestgen","year":"2006","unstructured":"Bestgen, Y.: Improving text segmentation using latent semantic analysis: A reanalysis of Choi, Wiemer-Hastings Deterministic and Moore (2001). Comput. Linguist. 1, 5\u201312 (2006)","journal-title":"Comput. Linguist."},{"key":"127_CR12","doi-asserted-by":"crossref","unstructured":"Brando, C., Domingu\u00e8s, C., Capeyron, M.: Evaluation of NER systems for the recognition of place mentions in French thematic corpora. In: Proceedings of the 10th Workshop on Geographic Information Retrieval, pp. 7:1\u20137:10 (2016)","DOI":"10.1145\/3003464.3003471"},{"key":"127_CR13","unstructured":"Choi, F.Y.Y.: Advances in domain independent linear text segmentation. In: Proceeding of the 1st Meeting of the North American Chapter of the ACL, pp. 26\u201333 (2000)"},{"key":"127_CR14","unstructured":"Choi, F.Y.Y., Wiemer-Hastings, P., Moore, J.: Latent semantic analysis for text segmentation. In: Proceeding 6th Conference on EMNLP, pp. 109\u2013117 (2001)"},{"key":"127_CR15","unstructured":"Cunningham, H., Maynard, D., Bontcheva, K., Tablan, V., Aswani, N., Roberts, I.: Text Processing with GATE (version 6). The University of Sheffield. http:\/\/tinyurl.com\/gatebook (2011)"},{"key":"127_CR16","doi-asserted-by":"crossref","unstructured":"Day, D., Aberdeen, J., Hirschman, L., Kozierok, R., Robinson, P., Vilain, M.: Mixed-initiative development of language processing systems. In: Proceedings of the 5th Conference on Applied Natural Language Processing (ANLP-97) (1997)","DOI":"10.3115\/974557.974608"},{"key":"127_CR17","unstructured":"Dlugolinsk\u00fd, S., Krammer, P., Ciglan, M., Laclav\u00edk, M., Hluch\u00fd, L.: Combining Named Entity Recognition Tools. In: 3rd Workshop on \u2018Making Sense of Microposts\u2019, (#MSM2013) World Wide Web Conference (2013)"},{"key":"127_CR18","doi-asserted-by":"crossref","unstructured":"Eisenstein, J., Barzilay, R.: Bayesian unsupervised topic segmentation. In: Proceedings of the 2008 Conference on Empirical Methods in Natural Language Processing, pp. 334\u2013343 (2008)","DOI":"10.3115\/1613715.1613760"},{"key":"127_CR19","unstructured":"Fragkou, P.: A comparison of information extraction and text segmentation for web content mining. In: Proceedings of 4th Language & Technology Conference: Human Language Technologies as a Challenge for Computer Science and Linguistics (LTC 2009), pp. 482\u2013486 (2009)"},{"key":"127_CR20","doi-asserted-by":"crossref","unstructured":"Grishman, R.: Information extraction: techniques and challenges. In: Pazienza, M.T. (ed.) Information Extraction: A Multidisciplinary Approach to an Emergine Information Technology (International Summer School SCIE-97), pp. 10\u201327. Springer, Frascatti (1997)","DOI":"10.1007\/3-540-63438-X_2"},{"issue":"1","key":"127_CR21","first-page":"33","volume":"23","author":"MA Hearst","year":"1997","unstructured":"Hearst, M.A.: TextTiling: segmenting text into multi-paragraph subtopic passages. Comput. Linguist. 23(1), 33\u201364 (1997)","journal-title":"Comput. Linguist."},{"key":"127_CR22","doi-asserted-by":"crossref","unstructured":"Heinonen, O.: Optimal multi-paragraph text segmentation by dynamic programming. In: Proceeding of the 17th COLING-ACL\u201998, pp. 1484\u20131486 (1998)","DOI":"10.3115\/980691.980814"},{"key":"127_CR23","doi-asserted-by":"crossref","unstructured":"Jiang, R., Banchs, R.E., Li, H.: Evaluating and combining named entity recognition systems. In: Proceedings of the Sixth Named Entity Workshop, Joint with 54th Association for Computational Linguistics, pp. 21\u201327, Berlin, Germany (2016)","DOI":"10.18653\/v1\/W16-2703"},{"key":"127_CR24","unstructured":"Kazantseva, A., Szpakowicz, S.: Topical segmentation: a study of human performance and a new measure of quality. In: Proceedings of the 2012 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 211\u2013220 (2012)"},{"key":"127_CR25","unstructured":"Kazantseva, A., Szpakowicz, S.: Linear text segmentation using affinity propagation. In: Proceedings of the 2011 Conference on Empirical Methods in Natural Language Processing, pp. 284\u2013293 (2011)"},{"key":"127_CR26","doi-asserted-by":"crossref","first-page":"209","DOI":"10.1016\/S0895-7177(04)90008-8","volume":"39","author":"A Kehagias","year":"2004","unstructured":"Kehagias, A., Nicolaou, A., Fragkou, P., Petridis, V.: Text segmentation by product partition models and dynamic programming. Math. Comput. Model. 39, 209\u2013217 (2004)","journal-title":"Math. Comput. Model."},{"key":"127_CR27","doi-asserted-by":"crossref","unstructured":"Kern, R., Granitzer, M.: Efficient linear text segmentation based on information retrieval techniques. In: Proceeding of the International Conference on Management of Emergent Digital EcoSystems (2009)","DOI":"10.1145\/1643823.1643854"},{"key":"127_CR28","doi-asserted-by":"crossref","unstructured":"Lamprier, S., Amghar, T., Levrat, B., Saubion, F.: On evaluation methodologies for text segmentation algorithms. In: Proceedings of the 19th IEEE International Conference on Tools with Artificial Intelligence, vol. 2, pp. 19\u201326 (2007)","DOI":"10.1109\/ICTAI.2007.22"},{"key":"127_CR29","first-page":"199","volume-title":"WordNet: An Electronic Lexical Database","author":"S Landes","year":"1998","unstructured":"Landes, S., Leacock, C., Fellbaum, C.: Building semantic concordances. In: Fellbaum, C. (ed.) WordNet: An Electronic Lexical Database, pp. 199\u2013216. MIT Press, Cambridge (1998)"},{"issue":"4","key":"127_CR30","doi-asserted-by":"crossref","first-page":"885","DOI":"10.1162\/COLI_a_00152","volume":"39","author":"H Lee","year":"2013","unstructured":"Lee, H., Chang, A., Peirsman, Y., Chambers, N., Surdeanu, M., Jurafsky, D.: Deterministic co- reference resolution based on entity-centric, precision-ranked rules. Comput. Linguist. 39(4), 885\u2013916 (2013)","journal-title":"Comput. Linguist."},{"key":"127_CR31","doi-asserted-by":"crossref","unstructured":"Litman, D., Passonneau, R.J.: Combining multiple knowledge sources for discourse segmentation. In: Proceedings of the 33rd Annual Meeting of the Association for Computational Linguistic, pp. 108\u2013115 (1995)","DOI":"10.3115\/981658.981673"},{"key":"127_CR32","unstructured":"Litman, D., Passonneau, R.J.: Developing algorithms for discourse segmentation. In: Proceedings of the AAAI 1995 Spring Symposium Series: Empirical Methods in Discourse Interpretation and Generation, pp. 85\u201391 (1995)"},{"key":"127_CR33","doi-asserted-by":"crossref","unstructured":"Malioutov, I., Barzilay, R.: Minimum cut model for spoken lecture segmentation. In: Proceedings of the 21st International Conference on Computational Linguistics and 44th Annual Meeting of the Association for Computational Linguistics, pp. 25\u201332 (2006)","DOI":"10.3115\/1220175.1220179"},{"key":"127_CR34","unstructured":"Marrero, M., S\u00e1nchez-Cuadrado, S., Morato Lara, J. Andreadakis, G.: Evaluation of named entity extraction systems. In: Advances in Computational Linguistics, Research in Computing Science, pp. 41\u201347 (2009)"},{"key":"127_CR35","unstructured":"Muller, C., Strube, M.: Multi-level annotation of linguistic data with MMAX2, corpus technology and language pedagogy. In: Braun, S., Kohn, K., Mukherjee, J. (eds.) New Resources, New Tools, New Methods. English Corpus Linguistics, vol. 3, pp. 197\u2013214 (2006)"},{"key":"127_CR36","doi-asserted-by":"crossref","unstructured":"Ogren, P.V.: Knowtator: A Protege plug-in for annotated corpus construction. In: Human Language Technology Conference Proceedings of the 2006 Conference of the North American Chapter of the Association for Computational Linguistics on Human Language Technology, pp. 273\u2013275 (2006)","DOI":"10.3115\/1225785.1225791"},{"issue":"1","key":"127_CR37","doi-asserted-by":"crossref","first-page":"19","DOI":"10.1162\/089120102317341756","volume":"28","author":"L Pevzner","year":"2002","unstructured":"Pevzner, L., Hearst, M.: A critique and improvement of an evaluation metric for text segmentation. Comput. Linguist. 28(1), 19\u201336 (2002)","journal-title":"Comput. Linguist."},{"key":"127_CR38","unstructured":"Pinto, A., Oliveira, H.G., Alves, A.O.: Comparing the performance of different NLP toolkits in formal and social media text. In: Proceedings of the 5th Symposium on Languages, Applications and Technologies (SLATE\u201916), pp. 1\u201316, OpenAccess Series in Informatics (OASIcs), ISBN 978-3-95977-006-4 (2016)"},{"issue":"3","key":"127_CR39","doi-asserted-by":"crossref","first-page":"130","DOI":"10.1108\/eb046814","volume":"14","author":"MF Porter","year":"1980","unstructured":"Porter, M.F.: An algorithm for suffix stripping. Program 14(3), 130\u2013137 (1980)","journal-title":"Program"},{"key":"127_CR40","doi-asserted-by":"crossref","unstructured":"Qi, S., Runxin, L., Dingsheng, L., Xihong, W.: Text segmentation with LDA-based fisher kernel. In: Proceeding of the 46th Annual Meeting of the Association for Computational Linguistics on Human Language Technologies, pp. 269\u2013272 (2008)","DOI":"10.3115\/1557690.1557768"},{"key":"127_CR41","doi-asserted-by":"crossref","unstructured":"Ratinov L., Roth, D.: Design challenges and misconceptions in named entity recognition. In: Proceeding CoNLL \u201909 Proceedings of the Thirteenth Conference on Computational Natural Language Learning, pp. 147\u2013155 (2009)","DOI":"10.3115\/1596374.1596399"},{"key":"127_CR42","unstructured":"Rodriquez, K.J., Bryant, M., Blanke, T., Luszczynska, M.: Comparison of named entity recognition tools for raw OCR text. In: Proceedings of KONVENS, pp. 410\u2013414 (2012)"},{"issue":"10","key":"127_CR43","doi-asserted-by":"crossref","first-page":"944","DOI":"10.1002\/(SICI)1097-4571(1999)50:10<944::AID-ASI9>3.0.CO;2-Q","volume":"50","author":"J Savoy","year":"1999","unstructured":"Savoy, J.: A stemming procedure and stopword list for general French corpora. J. Am. Soc. Inf. Sci. 50(10), 944\u2013952 (1999)","journal-title":"J. Am. Soc. Inf. Sci."},{"key":"127_CR44","unstructured":"Scaiano, M., Inkpen, D.: Getting more from segmentation evaluation. In: Proceedings of the Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 362\u2013366 (2012)"},{"key":"127_CR45","unstructured":"Siefkes, C.: An Incrementally Trainable Statistical Approach to Information Extraction Based on Token Classification and Rich Context Models. Ph.D. Thesis (2007)"},{"key":"127_CR46","doi-asserted-by":"crossref","unstructured":"Singh, S., Riedel, S., Martin, B., Zheng, J., McCallum, A.: Joint inference of entities, relations, and co-reference. In: Proceedings of the 2013 Workshop on Automated Knowledge Base Construction. CIKM\u201913 22nd ACM International Conference on Information and Knowledge Management, pp. 1\u20136 (2013)","DOI":"10.1145\/2509558.2509559"},{"key":"127_CR47","doi-asserted-by":"crossref","unstructured":"Simon, A., Gravier, G., Sebillot, P.: Leveraging lexical cohesion and disruption for topic segmentation. In: Proceedings of the 2013 Conference on Empirical Methods in Natural Language Processing, pp. 1314\u20131324 (2013)","DOI":"10.18653\/v1\/D13-1130"},{"key":"127_CR48","unstructured":"Sitbon L., Bellot, P.: Segmentation thematique par chaines lexicales ponderees. In: Proceedings of 12th Conference on Natural Language Processing (TALN 2005)"},{"key":"127_CR49","doi-asserted-by":"crossref","unstructured":"Stoyanov, V., Cardie, C., Gilbert, N., Riloff, E., Buttler, D. Hysom, D. : Reconcile: A Co-reference Resolution Platform. Technical Report, Cornell University (2010)","DOI":"10.2172\/970156"},{"key":"127_CR50","doi-asserted-by":"crossref","unstructured":"Utiyama, M., Isahara, H.: A statistical model for domain independent text segmentation. In: Proceedings of the 9th EACL, pp. 491\u2013498 (2001)","DOI":"10.3115\/1073012.1073076"},{"key":"127_CR51","doi-asserted-by":"crossref","unstructured":"Versley, Y., Ponzetto, S.P., Poesio, M., Eidelman, V., Jern, A., Smith, J., Yang, X., Moschitti, A.: BART: A modular toolkit for co-reference resolution. In: Proceedings of the 6th International Conference on Language Resources and Evaluation (LREC 2008) (2008)","DOI":"10.3115\/1564144.1564147"},{"key":"127_CR52","unstructured":"Xiang, J., Hongyuan, Z.: Domain-independent text segmentation using anisotropic diffusion and dynamic programming. In: Proceeding of the 26th ACM SIGIR Conference (2003)"},{"key":"127_CR53","doi-asserted-by":"crossref","unstructured":"Yao, L., Reidel, S., McCallum, A.: Universal schema for entity type prediction. In: The Third International Workshop on Automated Knowledge Base Construction (AKBC) (2013)","DOI":"10.1145\/2509558.2509572"},{"key":"127_CR54","unstructured":"Ye, N., Zhu, J., Luo, H., Wang, H., Zhang, B.: Improvement of the dotplotting method for linear text segmentation. In: Proceeding of the Natural Language Processing and Knowledge Engineering, pp. 636\u2013641 (2005)"},{"key":"127_CR55","unstructured":"Yu, K., Li, Z., Guan, G., Wang, Z., Feng, D.: Unsupervised text segmentation using LDA and MCMC. In: Proceedings of the Tenth Australasian Data Mining Conference (AusDM 2012), Sydney, Australia (2012)"}],"container-title":["Progress in Artificial Intelligence"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s13748-017-0127-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s13748-017-0127-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s13748-017-0127-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T10:51:12Z","timestamp":1750243872000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s13748-017-0127-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,5,9]]},"references-count":55,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2017,12]]}},"alternative-id":["127"],"URL":"https:\/\/doi.org\/10.1007\/s13748-017-0127-3","relation":{},"ISSN":["2192-6352","2192-6360"],"issn-type":[{"type":"print","value":"2192-6352"},{"type":"electronic","value":"2192-6360"}],"subject":[],"published":{"date-parts":[[2017,5,9]]}}}