{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,27]],"date-time":"2026-02-27T07:06:11Z","timestamp":1772175971796,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":16,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,1,16]],"date-time":"2021-01-16T00:00:00Z","timestamp":1610755200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/501100004663","name":"Ministry of Science and Technology, Taiwan","doi-asserted-by":"publisher","award":["MOST109-2221-E-035-064"],"award-info":[{"award-number":["MOST109-2221-E-035-064"]}],"id":[{"id":"10.13039\/501100004663","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,1,16]]},"DOI":"10.1145\/3474944.3474958","type":"proceedings-article","created":{"date-parts":[[2021,10,15]],"date-time":"2021-10-15T14:38:28Z","timestamp":1634308708000},"page":"82-87","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Using Spark for Text Mining on Large Scale Liver Cancer Literature"],"prefix":"10.1145","author":[{"given":"Ming-Yen","family":"Lin","sequence":"first","affiliation":[{"name":"Feng Chia University, Taiwan"}]},{"given":"Yu-Ju","family":"Lin","sequence":"additional","affiliation":[{"name":"Feng Chia University, Taiwan"}]},{"given":"Sue-Chen","family":"Hsueh","sequence":"additional","affiliation":[{"name":"Chaoyang University of Technology, Taiwan"}]}],"member":"320","published-online":{"date-parts":[[2021,10,15]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Retrieved","author":"Statistics","year":"2016","unstructured":"Statistics of Death for Year 2016 in Taiwan . Retrieved August 28, 2017, from http:\/\/www.mohw.gov.tw\/cp-16-33598-1.html. Statistics of Death for Year 2016 in Taiwan. Retrieved August 28, 2017, from http:\/\/www.mohw.gov.tw\/cp-16-33598-1.html."},{"key":"e_1_3_2_1_2_1","volume-title":"Retrieved","author":"Apache Spark\u2122","year":"2017","unstructured":"Apache Spark\u2122 Lightning-fast cluster computing . Retrieved August 28, 2017 , from https:\/\/spark.apache.org\/. Apache Spark\u2122 Lightning-fast cluster computing. Retrieved August 28, 2017, from https:\/\/spark.apache.org\/."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"crossref","unstructured":"Cortes C. & Vapnik V. (1995 September). Support-vector networks. Machine learning 20(3) 273-297.  Cortes C. & Vapnik V. (1995 September). Support-vector networks. Machine learning 20(3) 273-297.","DOI":"10.1007\/BF00994018"},{"key":"e_1_3_2_1_4_1","volume-title":"Comparative Study of Apache Spark MLlib Clustering Algorithms. In International Conference on Data Mining and Big Data (pp. 61-73)","author":"Harifi S.","year":"2017","unstructured":"Harifi , S. , Byagowi , E. , & Khalilian , M. ( 2017 , July) . Comparative Study of Apache Spark MLlib Clustering Algorithms. In International Conference on Data Mining and Big Data (pp. 61-73) . Springer, Cham. Harifi, S., Byagowi, E., & Khalilian, M. (2017, July). Comparative Study of Apache Spark MLlib Clustering Algorithms. In International Conference on Data Mining and Big Data (pp. 61-73). Springer, Cham."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1002\/hep4.1182"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0156031"},{"key":"e_1_3_2_1_7_1","unstructured":"NCBI \u2013 PubMed. Retrieved August 28 2017 from https:\/\/www.ncbi.nlm.nih.gov\/pubmed\/.  NCBI \u2013 PubMed. Retrieved August 28 2017 from https:\/\/www.ncbi.nlm.nih.gov\/pubmed\/."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"crossref","unstructured":"Peng C. Y. J. Lee K. L. & Ingersoll G. M. (2002 April). An introduction to logistic regression analysis and reporting. The journal of educational research 96(1) 3-14.  Peng C. Y. J. Lee K. L. & Ingersoll G. M. (2002 April). An introduction to logistic regression analysis and reporting. The journal of educational research 96(1) 3-14.","DOI":"10.1080\/00220670209598786"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"crossref","unstructured":"Raghupathi W. & Raghupathi V. (2014 February). Big data analytics in healthcare: promise and potential. Health information science and systems 2(1) 3.  Raghupathi W. & Raghupathi V. (2014 February). Big data analytics in healthcare: promise and potential. Health information science and systems 2(1) 3.","DOI":"10.1186\/2047-2501-2-3"},{"key":"e_1_3_2_1_10_1","volume-title":"A hadoop-based method to predict potential effective drug combination. BioMed research international","author":"Sun Y.","year":"2014","unstructured":"Sun , Y. , Xiong , Y. , Xu , Q. , & Wei , D. (2014, July ). A hadoop-based method to predict potential effective drug combination. BioMed research international , 2014 , 196858. Sun, Y., Xiong, Y., Xu, Q., & Wei, D. (2014, July). A hadoop-based method to predict potential effective drug combination. BioMed research international, 2014, 196858."},{"key":"e_1_3_2_1_11_1","volume-title":"PDQ Cancer Information Summaries [Internet].","author":"Cancer Genetics Overview","year":"2002","unstructured":"PDQ Cancer Genetics Overview (PDQ\u00ae). In: PDQ Cancer Information Summaries [Internet]. Bethesda, MD : National Cancer Institute ; 2002 . Retrieved November 01, 2017, from http:\/\/cancerres.aacrjournals.org\/content\/76\/22\/6747.full. PDQ Cancer Genetics Overview (PDQ\u00ae). In: PDQ Cancer Information Summaries [Internet]. Bethesda, MD: National Cancer Institute; 2002. Retrieved November 01, 2017, from http:\/\/cancerres.aacrjournals.org\/content\/76\/22\/6747.full."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"crossref","unstructured":"Vincent B. Vincent M. & Ferreira C. G. (2006 March). Making PubMed searching simple: learning to retrieve medical literature through interactive problem solving. The oncologist 11(3) 243-251.  Vincent B. Vincent M. & Ferreira C. G. (2006 March). Making PubMed searching simple: learning to retrieve medical literature through interactive problem solving. The oncologist 11(3) 243-251.","DOI":"10.1634\/theoncologist.11-3-243"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"crossref","unstructured":"Wang S. H. Ding Y. Zhao W. Huang Y. H. Perkins R. Zou W. & Chen J. J. (2016 March). Text mining for identifying topics in the literatures about adolescent substance use and depression. BMC public health 16(1) 279.  Wang S. H. Ding Y. Zhao W. Huang Y. H. Perkins R. Zou W. & Chen J. J. (2016 March). Text mining for identifying topics in the literatures about adolescent substance use and depression. BMC public health 16(1) 279.","DOI":"10.1186\/s12889-016-2932-1"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0162721"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0156091"},{"key":"e_1_3_2_1_16_1","volume-title":"Feature extraction. Retrieved November, 01","author":"Scikit","year":"2017","unstructured":"Scikit - Learn - 4.2. Feature extraction. Retrieved November, 01 , 2017 , from http:\/\/scikit-learn.org\/stable\/modules\/feature_extraction.html Scikit- Learn - 4.2. Feature extraction. Retrieved November, 01, 2017, from http:\/\/scikit-learn.org\/stable\/modules\/feature_extraction.html"}],"event":{"name":"BDET 2021: 2021 the 3rd International Conference on Big Data Engineering and Technology","location":"Singapore Singapore","acronym":"BDET 2021"},"container-title":["2021 the 3rd International Conference on Big Data Engineering and Technology (BDET)"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3474944.3474958","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3474944.3474958","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T21:28:44Z","timestamp":1750195724000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3474944.3474958"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,1,16]]},"references-count":16,"alternative-id":["10.1145\/3474944.3474958","10.1145\/3474944"],"URL":"https:\/\/doi.org\/10.1145\/3474944.3474958","relation":{},"subject":[],"published":{"date-parts":[[2021,1,16]]},"assertion":[{"value":"2021-10-15","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}