{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,8]],"date-time":"2026-05-08T05:38:39Z","timestamp":1778218719867,"version":"3.51.4"},"reference-count":35,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2020,6,25]],"date-time":"2020-06-25T00:00:00Z","timestamp":1593043200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,6,25]],"date-time":"2020-06-25T00:00:00Z","timestamp":1593043200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"funder":[{"name":"Ho Chi Minh City Department of Science and Technology","award":["15\/2016\/H\u0110-SKHCN"],"award-info":[{"award-number":["15\/2016\/H\u0110-SKHCN"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Lang Resources &amp; Evaluation"],"published-print":{"date-parts":[[2020,12]]},"DOI":"10.1007\/s10579-020-09495-4","type":"journal-article","created":{"date-parts":[[2020,6,25]],"date-time":"2020-06-25T21:02:22Z","timestamp":1593118942000},"page":"893-920","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":15,"title":["ViMs: a high-quality Vietnamese dataset for abstractive multi-document summarization"],"prefix":"10.1007","volume":"54","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2118-203X","authenticated-orcid":false,"given":"Nhi-Thao","family":"Tran","sequence":"first","affiliation":[]},{"given":"Minh-Quoc","family":"Nghiem","sequence":"additional","affiliation":[]},{"given":"Nhung T. H.","family":"Nguyen","sequence":"additional","affiliation":[]},{"given":"Ngan Luu-Thuy","family":"Nguyen","sequence":"additional","affiliation":[]},{"given":"Nam","family":"Van Chi","sequence":"additional","affiliation":[]},{"given":"Dien","family":"Dinh","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,6,25]]},"reference":[{"key":"9495_CR1","unstructured":"Benikova, D., Mieskes, M., Meyer, C.M., & Gurevych, I. (2016). Bridging the gap between extractive and abstractive summaries: Creation and evaluation of coherent extracts from heterogeneous sources. In Proceedings of COLING 2016, the 26th International Conference on Computational Linguistics: Technical Papers (pp. 1039\u20131050)."},{"key":"9495_CR2","unstructured":"Dang, H.T. (2005). Overview of DUC 2005. In Proceedings of the document understanding conference (vol. 2005, pp. 1\u201312)."},{"key":"9495_CR3","unstructured":"Dang, H.T., & Owczarzak, K. (2008). Overview of the TAC 2008 opinion question answering and summarization tasks. In Proceedings of the First Text Analysis Conference (vol. 2)."},{"issue":"2","key":"9495_CR4","doi-asserted-by":"publisher","first-page":"264","DOI":"10.1145\/321510.321519","volume":"16","author":"HP Edmundson","year":"1969","unstructured":"Edmundson, H. P. (1969). New methods in automatic extracting. Journal of the ACM (JACM), 16(2), 264\u2013285.","journal-title":"Journal of the ACM (JACM)"},{"key":"9495_CR5","unstructured":"Giannakopoulos, G. (2013) Multi-document multilingual summarization and evaluation tracks in acl 2013 multiling workshop. In Proceedings of the MultiLing 2013 Workshop on Multilingual Multi-document Summarization (pp. 20\u201328)."},{"issue":"3","key":"9495_CR6","first-page":"5","volume":"5","author":"G Giannakopoulos","year":"2008","unstructured":"Giannakopoulos, G., Karkaletsis, V., Vouros, G., & Stamatopoulos, P. (2008). Summarization system evaluation revisited: N-gram graphs. ACM Transactions on Speech and Language Processing (TSLP), 5(3), 5.","journal-title":"ACM Transactions on Speech and Language Processing (TSLP)"},{"key":"9495_CR7","unstructured":"Giannakopoulos, G., El-Haj, M., Favre, B., Litvak, M., Steinberger, J., & Varma, V. (2011). TAC 2011 MultiLing pilot overview."},{"key":"9495_CR8","doi-asserted-by":"crossref","unstructured":"Giannakopoulos, G., Kubina, J., Conroy, J., Steinberger, J., Favre, B., Kabadjov, M., Kruschwitz, U., & Poesio, M. (2015). MultiLing 2015: multilingual summarization of single and multi-documents, on-line fora, and call-center conversations. In Proceedings of the 16th Annual Meeting of the Special Interest Group on Discourse and Dialogue (pp. 270\u2013274).","DOI":"10.18653\/v1\/W15-4638"},{"key":"9495_CR9","doi-asserted-by":"crossref","unstructured":"Giannakopoulos, G., Conroy, J., Kubina, J., Rankel, P.A., Lloret, E., Steinberger, J., Litvak, M., & Favre, B. (2017). MultiLing 2017 overview. In Proceedings of the MultiLing 2017 workshop on summarization and summary evaluation across source types and genres (pp. 1\u20136).","DOI":"10.18653\/v1\/W17-1001"},{"key":"9495_CR40","doi-asserted-by":"crossref","unstructured":"Goldstein J, Mittal V, Carbonell J, Callan J (2000) Creating and evaluating multi-document sentence extract summaries. In Proceedings of the ninth international conference on information and knowledge management (CIKM) McLean, VA, USA, pp  165\u2013172.","DOI":"10.1145\/354756.354815"},{"key":"9495_CR11","doi-asserted-by":"crossref","unstructured":"Hong\u00a0Phuong, L., Thi Minh\u00a0Huyen, N., Roussanaly, A., & Vinh, H.T. (2008). A hybrid approach to word segmentation of Vietnamese texts. In International Conference on Language and Automata Theory and Applications (pp. 240\u2013249). Springer.","DOI":"10.1007\/978-3-540-88282-4_23"},{"key":"9495_CR12","unstructured":"Jaidka, K., Chandrasekaran, M.K., Elizalde, B.F., Jha, R., Jones, C., Kan, M.Y., Khanna, A., Molla-Aliod, D., Radev, D.R., Ronzano, F., et al. (2014). The computational linguistics summarization pilot task. In Proceedings of Text Ananlysis Conference, Gaithersburg, USA."},{"key":"9495_CR13","unstructured":"Ji, H., Grishman, R., Dang, H.T., Griffitt, K., & Ellis, J. (2010). Overview of the TAC 2010 knowledge base population track. In Third Text Analysis Conference (vol. 3, pp. 3\u20133)."},{"key":"9495_CR14","unstructured":"Jing, H., Barzilay, R., McKeown, K., & Elhadad, M. (1998). Summarization evaluation methods: Experiments and analysis. In AAAI symposium on intelligent summarization, Palo Alto, CA (pp. 51\u201359)."},{"key":"9495_CR15","doi-asserted-by":"publisher","first-page":"159","DOI":"10.2307\/2529310","volume":"33","author":"JR Landis","year":"1977","unstructured":"Landis, J. R., & Koch, G. G. (1977). The measurement of observer agreement for categorical data. Biometrics, 33, 159\u2013174.","journal-title":"Biometrics"},{"key":"9495_CR16","doi-asserted-by":"crossref","unstructured":"Le, T., Nguyen, L.M., Shimazu, A., & Dien, D. (2016) Phrase-based compressive summarization for English-Vietnamese. In International Symposium on Integrated Uncertainty in Knowledge Modelling and Decision Making (pp. 331\u2013342). Springer.","DOI":"10.1007\/978-3-319-49046-5_28"},{"key":"9495_CR17","unstructured":"Lin, C.Y. (2004). Rouge: A package for automatic evaluation of summaries. In Text summarization branches out: Proceedings of the ACL-04 workshop, Barcelona, Spain (vol. 8)."},{"key":"9495_CR18","doi-asserted-by":"crossref","unstructured":"Litvak, M., Vanetik, N., Last, M., & Churkin, E. (2016). Museec: a multilingual text summarization tool. In Proceedings of ACL-2016 System Demonstrations (pp. 73\u201378).","DOI":"10.18653\/v1\/P16-4013"},{"key":"9495_CR19","doi-asserted-by":"crossref","unstructured":"Liu, F., & Liu, Y. (2008). Correlation between rouge and human evaluation of extractive meeting summaries. In Proceedings of the 46th annual meeting of the association for computational linguistics on human language technologies: Short papers, Association for Computational Linguistics (pp. 201\u2013204).","DOI":"10.3115\/1557690.1557747"},{"issue":"1","key":"9495_CR20","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10462-011-9216-z","volume":"37","author":"E Lloret","year":"2012","unstructured":"Lloret, E., & Palomar, M. (2012). Text summarisation in progress: a literature review. Artificial Intelligence Review, 37(1), 1\u201341.","journal-title":"Artificial Intelligence Review"},{"key":"9495_CR41","unstructured":"Loupy C, Guegan M, Ayache C, Seng S, Torres Moreno J-M (2010) A French human reference corpus for multi-document summarization and sentence compression. In Proceedings of the seventh international conference on language resources and evaluation (LREC), Valletta, Malta, pp 3113\u20133118"},{"issue":"1","key":"9495_CR21","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1017\/S1351324901002741","volume":"8","author":"I Mani","year":"2002","unstructured":"Mani, I., Klein, G., House, D., Hirschman, L., Firmin, T., & Sundheim, B. (2002). SUMMAC: a text summarization evaluation. Natural Language Engineering, 8(1), 43\u201368.","journal-title":"Natural Language Engineering"},{"key":"9495_CR22","doi-asserted-by":"crossref","unstructured":"Meyer, C.M., Benikova, D., Mieskes, M., & Gurevych, I. (2016). MDSWriter: Annotation tool for creating high-quality multi-document summarization corpora. In Proceedings of ACL-2016 System Demonstrations (pp. 97\u2013102).","DOI":"10.18653\/v1\/P16-4017"},{"key":"9495_CR23","unstructured":"Mihalcea, R., & Tarau, P. (2004) Textrank: Bringing order into text. In Proceedings of the 2004 conference on empirical methods in natural language processing."},{"key":"9495_CR25","doi-asserted-by":"crossref","unstructured":"Nenkova, A., Siddharthan, A., & McKeown, K. (2005) Automatically learning cognitive status for multi-document summarization of newswire. In Proceedings of the conference on human language technology and empirical methods in natural language processing, Association for Computational Linguistics (pp. 241\u2013248).","DOI":"10.3115\/1220575.1220606"},{"issue":"2","key":"9495_CR26","doi-asserted-by":"publisher","first-page":"4","DOI":"10.1145\/1233912.1233913","volume":"4","author":"A Nenkova","year":"2007","unstructured":"Nenkova, A., Passonneau, R., & McKeown, K. (2007). The pyramid method: Incorporating human content selection variation in summarization evaluation. ACM Transactions on Speech and Language Processing (TSLP), 4(2), 4.","journal-title":"ACM Transactions on Speech and Language Processing (TSLP)"},{"key":"9495_CR27","doi-asserted-by":"crossref","unstructured":"Nguyen, H.N., Van\u00a0Le, T., Le, H.S., & Pham, T.V. (2014). Domain specific sentiment dictionary for opinion mining of Vietnamese text. In International Workshop on Multi-disciplinary Trends in Artificial Intelligence (pp. 136\u2013148). Springer.","DOI":"10.1007\/978-3-319-13365-2_13"},{"key":"9495_CR28","unstructured":"Nguyen, M.T., Lai, D.V., Do, P.K., Tran, D.V., & Nguyen, M.L. (2016). VSoLSCSum: Building a Vietnamese sentence-comment dataset for social context summarization. In Proceedings of the 12th Workshop on Asian Language Resources (ALR12) (pp. 38\u201348)."},{"key":"9495_CR29","doi-asserted-by":"crossref","unstructured":"Nguyen, T.C., Le, H.M., & Phan, T.T. (2009). Building knowledge base for Vietnamese information retrieval. In Proceedings of the 11th International Conference on Information Integration and Web-based Applications & Services (pp. 482\u2013486). ACM.","DOI":"10.1145\/1806338.1806428"},{"key":"9495_CR30","doi-asserted-by":"publisher","first-page":"240","DOI":"10.1098\/rspl.1895.0041","volume":"58","author":"K Pearson","year":"1895","unstructured":"Pearson, K. (1895). Note on regression and inheritance in the case of two parents. Proceedings of the Royal Society of London, 58, 240\u2013242.","journal-title":"Proceedings of the Royal Society of London"},{"key":"9495_CR31","doi-asserted-by":"crossref","unstructured":"Radev, D.R., Teufel, S., Saggion, H., Lam, W., Blitzer, J., Qi, H., Celebi, A., Liu, D., & Drabek, E. (2003). Evaluation challenges in large-scale document summarization. In Proceedings of the 41st Annual Meeting on Association for Computational Linguistics-Volume 1, Association for Computational Linguistics (pp. 375\u2013382).","DOI":"10.3115\/1075096.1075144"},{"key":"9495_CR32","unstructured":"Seki, Y., Eguchi, K., Kando, N., Aono, M. (2005). Multi-document summarization with subjectivity analysis at DUC 2005. In Proceedings of the Document Understanding Conference (DUC)."},{"key":"9495_CR33","doi-asserted-by":"crossref","unstructured":"Ung, V.G., Luong, A.V., Tran, N.T., & Nghiem, M.Q. (2015). Combination of features for Vietnamese news multi-document summarization. In Knowledge and Systems Engineering (KSE), 2015 Seventh International Conference on, IEEE (pp. 186\u2013191).","DOI":"10.1109\/KSE.2015.71"},{"key":"9495_CR34","first-page":"1","volume":"52","author":"S Verberne","year":"2017","unstructured":"Verberne, S., Krahmer, E., Hendrickx, I., Wubben, S., & van Den Bosch, A. (2017). Creating a reference data set for the summarization of discussion forum threads. Language Resources and Evaluation, 52, 1\u201323.","journal-title":"Language Resources and Evaluation"},{"issue":"3","key":"9495_CR35","first-page":"243","volume":"8","author":"M William","year":"1988","unstructured":"William, M., & Thompson, S. (1988). Rhetorical structure theory: towards a functional theory of text organization. Text, 8(3), 243\u2013281.","journal-title":"Text"}],"container-title":["Language Resources and Evaluation"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-020-09495-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10579-020-09495-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-020-09495-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,6,24]],"date-time":"2021-06-24T23:41:41Z","timestamp":1624578101000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10579-020-09495-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,6,25]]},"references-count":35,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2020,12]]}},"alternative-id":["9495"],"URL":"https:\/\/doi.org\/10.1007\/s10579-020-09495-4","relation":{},"ISSN":["1574-020X","1574-0218"],"issn-type":[{"value":"1574-020X","type":"print"},{"value":"1574-0218","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,6,25]]},"assertion":[{"value":"25 June 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}