{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:28:25Z","timestamp":1750220905514,"version":"3.41.0"},"publisher-location":"New York, New York, USA","reference-count":26,"publisher":"ACM Press","license":[{"start":{"date-parts":[[2019,1,1]],"date-time":"2019-01-01T00:00:00Z","timestamp":1546300800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019]]},"DOI":"10.1145\/3368926.3369688","type":"proceedings-article","created":{"date-parts":[[2019,12,20]],"date-time":"2019-12-20T13:30:11Z","timestamp":1576848611000},"page":"29-35","source":"Crossref","is-referenced-by-count":5,"title":["Extractive Multi-document Summarization using K-means, Centroid-based Method, MMR, and Sentence Position"],"prefix":"10.1145","author":[{"given":"Hai Cao","family":"Manh","sequence":"first","affiliation":[{"name":"Hanoi University of Science and Technology, Vietnam"}]},{"given":"Huong","family":"Le Thanh","sequence":"additional","affiliation":[{"name":"Hanoi University of Science and Technology, Vietnam"}]},{"given":"Tuan Luu","family":"Minh","sequence":"additional","affiliation":[{"name":"Hanoi University of Science and Technology, Vietnam"}]}],"member":"320","reference":[{"key":"key-10.1145\/3368926.3369688-1","unstructured":"Abhijit Mondal. Understanding Word Vectors and Word2Vec. URL: http:\/\/www.stokastik.in\/understanding-word-vectors-and-word2vec\/. (Last updated: 02 May 2019)."},{"key":"key-10.1145\/3368926.3369688-2","unstructured":"Christopher O. 2015. Understanding LSTM Networks. Retrieved from http:\/\/colah.github.io\/posts\/2015-08-Understanding-LSTMs\/."},{"key":"key-10.1145\/3368926.3369688-3","doi-asserted-by":"crossref","unstructured":"Dragomir R. 
Radev; Hongyan Jing; Malgorzata Stys; and Daniel Tam. 2004. Centroid-based summarization of multiple documents. In: Inf. Process. Manage., 40(6):919--938","DOI":"10.1016\/j.ipm.2003.10.006"},{"key":"key-10.1145\/3368926.3369688-4","unstructured":"DUC 2007: Task, Documents, and Measures. url: https:\/\/duc.nist.gov\/duc2007\/tasks.html. (Last updated: 02 May 2019)."},{"key":"key-10.1145\/3368926.3369688-5","doi-asserted-by":"crossref","unstructured":"E. Hovy and C.-Y. Lin. 1996. Automated text summarization and the SUMMARIST system. In Proc. of a workshop on held at Baltimore, Maryland, pages 197--214, Baltimore, Maryland.","DOI":"10.3115\/1119089.1119121"},{"key":"key-10.1145\/3368926.3369688-6","doi-asserted-by":"crossref","unstructured":"Gaetano Rossiello, Pierpaolo Basile, Giovanni Semeraro. 2017. Centroid-based Text Summarization through Compositionality of Word Embeddings. Proceedings of the MultiLing 2017 Workshop on Summarization and Summary Evaluation Across Source Types and Genres.","DOI":"10.18653\/v1\/W17-1003"},{"key":"key-10.1145\/3368926.3369688-7","unstructured":"G. Erkan and D. R. Radev. 2004. LexPageRank: Prestige in multi-document text summarization. In Proc. of EMNLP'04, Barcelona, Spain."},{"key":"key-10.1145\/3368926.3369688-8","doi-asserted-by":"crossref","unstructured":"George A. Miller. 1995. Wordnet: a lexical database for English. In: Communications of the ACM 38(11):39--41.","DOI":"10.1145\/219717.219748"},{"key":"key-10.1145\/3368926.3369688-9","unstructured":"Gunes Erkan and Dragomir R. Radev. 2004. LexRank: Graph-based Lexical Centrality as Salience in Text Summarization. In Journal of Artificial Intelligence Research 22 (2004) 457--479."},{"key":"key-10.1145\/3368926.3369688-10","unstructured":"Harshal J. Jain, M. S. Bewoor and S. H. Patil. 2012. Context Sensitive Text Summarization Using K Means Clustering Algorithm. 
In International Journal of Soft Computing and Engineering."},{"key":"key-10.1145\/3368926.3369688-11","doi-asserted-by":"crossref","unstructured":"Jaime Carbonell and Jade Goldstein. 1998. The Use of MMR, Diversity-Based Reranking for Reordering Documents and Producing Summaries. In Research and Development in Information Retrieval.","DOI":"10.1145\/290941.291025"},{"key":"key-10.1145\/3368926.3369688-12","doi-asserted-by":"crossref","unstructured":"Kaustubh Mani, Ishan Verma, Hardik Meisheri, and Lipika Dey. 2018. Multi-Document Summarization using Distributed Bag-of-Words Model. In: 2018 IEEE\/WIC\/ACM International Conference on Web Intelligence (WI).","DOI":"10.1109\/WI.2018.00-14"},{"key":"key-10.1145\/3368926.3369688-13","unstructured":"Meishan Hu; Aixin Sun; and Ee-Peng Lim. 2008. Comments-oriented document summarization: understanding documents with readers' feedback. In Proc. of the 31st ACM SIGIR, 291--298. ACM."},{"key":"key-10.1145\/3368926.3369688-14","doi-asserted-by":"crossref","unstructured":"M R Prathima, H R Divakar. 2018. Automatic Extractive Text Summarization Using K-Means Clustering. In International Journal of Computer Sciences and Engineering.","DOI":"10.26438\/ijcse\/v6i6.782787"},{"key":"key-10.1145\/3368926.3369688-15","unstructured":"Quoc Le; and Tomas Mikolov. 2014. Distributed representations of sentences and documents. In: Proceedings of the 31st International Conference on Machine Learning (ICML-14), pages 1188--1196."},{"key":"key-10.1145\/3368926.3369688-16","unstructured":"Q. Zhou, L. Sun, and J.-Y. Nie. 2005. IS SUM: A multi-document summarizer based on document index graphic and lexical chains. In Proceeding of DUC2005."},{"key":"key-10.1145\/3368926.3369688-17","doi-asserted-by":"crossref","unstructured":"Rachit Arora; and Balaraman Ravindran. 2008. Latent Dirichlet Allocation Based MultiDocument Summarization. 
In Conference on Information and Knowledge Management.","DOI":"10.1145\/1390749.1390764"},{"key":"key-10.1145\/3368926.3369688-18","unstructured":"R. Barzilay and M. Elhadad. 1997. Using lexical chains for text summarization. In Proc. of the Intelligent Scalable Text Summarization Workshop, Madrid, Spain, 1997."},{"key":"key-10.1145\/3368926.3369688-19","unstructured":"R. Mihalcea and P. Tarau. 2004. TextRank: Bringing order into text. In Proc. of EMNLP'04, pages 404--411, Barcelona, Spain."},{"key":"key-10.1145\/3368926.3369688-20","doi-asserted-by":"crossref","unstructured":"Sergey Brin and Lawrence Page. 1998. The anatomy of a large-scale hypertextual Web search engine. In: Computer Networks and ISDN systems 30(1--7):107--117. 1998.","DOI":"10.1016\/S0169-7552(98)00110-X"},{"key":"key-10.1145\/3368926.3369688-21","unstructured":"Phạm Hoàng Anh. 2019. Xây dựng chương trình tóm tắt văn bản (tiếng Việt) đơn giản với Machine Learning. URL: https:\/\/viblo.asia\/p\/xay-dung-chuong-trinh-tom-tat-van-ban-tieng-viet-don-gian-voi-machine-learning-YWOZrgAwlQ0. (Last updated 09\/09\/2019)."},{"key":"key-10.1145\/3368926.3369688-22","doi-asserted-by":"crossref","unstructured":"Radev, Dragomir R. and Jing, Hongyan and Budzikowska, Malgorzata. 2000. Centroid-based summarization of multiple documents: sentence extraction, utility-based evaluation, and user studies. In NAACL-ANLP 2000 Workshop: Automatic Summarization.","DOI":"10.3115\/1117575.1117578"},{"key":"key-10.1145\/3368926.3369688-23","unstructured":"What Is ROUGE And How It Works For Evaluation Of Summarization Tasks? url: https:\/\/rxnlp.com\/how-rouge-works-for-evaluation-of-summarizationtasks\/#.XOO5Z8j7TIW. (Last updated: 02 May 2019)."},{"key":"key-10.1145\/3368926.3369688-24","doi-asserted-by":"crossref","unstructured":"X. Wan and J. Yang. 2007. CollabSum: exploiting multiple document clustering for collaborative single document summarizations. 
In Proc. of SIGIR'07, pages 143--150, Amsterdam, The Netherlands.","DOI":"10.1145\/1277741.1277768"},{"key":"key-10.1145\/3368926.3369688-25","doi-asserted-by":"crossref","unstructured":"Yihong Gong; and Xin Liu. 2001. Generic text summarization using relevance measure and latent semantic analysis. In Research and Development in Information Retrieval.","DOI":"10.1145\/383952.383955"},{"key":"key-10.1145\/3368926.3369688-26","unstructured":"Zhanying He; Chun Chen; Jiajun Bu; Can Wang; and Lijun Zhang. 2012. Document summarization based on data reconstruction. In Proceedings of AAAI."}],"event":{"number":"10","sponsor":["SOICT, School of Information and Communication Technology - HUST","NAFOSTED, The National Foundation for Science and Technology Development"],"acronym":"SoICT 2019","name":"the Tenth International Symposium","start":{"date-parts":[[2019,12,4]]},"location":"Hanoi, Ha Long Bay, Viet Nam","end":{"date-parts":[[2019,12,6]]}},"container-title":["Proceedings of the Tenth International Symposium on Information and Communication Technology - SoICT 2019"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3368926.3369688","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/dl.acm.org\/ft_gateway.cfm?id=3369688&ftid=2101272&dwn=1","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T23:44:51Z","timestamp":1750203891000},"score":1,"resource":{"primary":{"URL":"http:\/\/dl.acm.org\/citation.cfm?doid=3368926.3369688"}},"subtitle":[],"proceedings-subject":"Information and Communication Technology","short-title":[],"issued":{"date-parts":[[2019]]},"references-count":26,"URL":"https:\/\/doi.org\/10.1145\/3368926.3369688","relation":{},"subject":[],"published":{"date-parts":[[2019]]}}}