{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,29]],"date-time":"2025-10-29T19:27:54Z","timestamp":1761766074738},"publisher-location":"Cham","reference-count":17,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319393773"},{"type":"electronic","value":"9783319393780"}],"license":[{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016]]},"DOI":"10.1007\/978-3-319-39378-0_53","type":"book-chapter","created":{"date-parts":[[2016,5,28]],"date-time":"2016-05-28T07:40:51Z","timestamp":1464421251000},"page":"621-630","source":"Crossref","is-referenced-by-count":14,"title":["Distributed Classification of Text Documents on Apache Spark Platform"],"prefix":"10.1007","author":[{"given":"Piotr","family":"Semberecki","sequence":"first","affiliation":[]},{"given":"Henryk","family":"Maciejewski","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,5,29]]},"reference":[{"issue":"1","key":"53_CR1","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/505282.505283","volume":"34","author":"F Sebastiani","year":"2002","unstructured":"Sebastiani, F.: Machine learning in automated text categorization. ACM Comput. Surv. (CSUR) 34(1), 1\u201347 (2002)","journal-title":"ACM Comput. Surv. (CSUR)"},{"issue":"1","key":"53_CR2","doi-asserted-by":"crossref","first-page":"83","DOI":"10.1007\/s10579-009-9111-2","volume":"45","author":"M Koppel","year":"2011","unstructured":"Koppel, M., Schler, J., Argamon, S.: Authorship attribution in the wild. Lang. Resour. Eval. 45(1), 83\u201394 (2011)","journal-title":"Lang. Resour. Eval."},{"issue":"3","key":"53_CR3","doi-asserted-by":"crossref","first-page":"538","DOI":"10.1002\/asi.21001","volume":"60","author":"E Stamatatos","year":"2009","unstructured":"Stamatatos, E.: A survey of modern authorship attribution methods. JASIST 60(3), 538\u2013556 (2009)","journal-title":"JASIST"},{"issue":"4","key":"53_CR4","first-page":"301","volume":"6","author":"K Torkkola","year":"2004","unstructured":"Torkkola, K.: Discriminative features for text document classification. Formal Pattern Anal. Appl. 6(4), 301\u2013308 (2004)","journal-title":"Formal Pattern Anal. Appl."},{"key":"53_CR5","unstructured":"Jurafsky, D., Manning, C.: Natural Language Processing. https:\/\/www.coursera.org\/course\/nlp"},{"key":"53_CR6","first-page":"10","volume":"10","author":"M Zaharia","year":"2010","unstructured":"Zaharia, M., Chowdhury, M., Franklin, M.J., Shenker, S., Stoica, I.: Spark: cluster computing with working sets. HotCloud 10, 10 (2010)","journal-title":"HotCloud"},{"key":"53_CR7","doi-asserted-by":"crossref","unstructured":"Nesi, P., Pantaleo, G., Sanesi, G.: A distributed framework for NLP-based keyword and keyphrase extraction from web pages and documents. In: 21st International Conference on Distributed Multimedia Systems, DMS2015 (2015)","DOI":"10.18293\/DMS2015-024"},{"key":"53_CR8","volume-title":"Natural Language Processing with Python - Analyzing Text with the Natural Language Toolkit","author":"S Bird","year":"2009","unstructured":"Bird, S., Klein, E., Loper, E.: Natural Language Processing with Python - Analyzing Text with the Natural Language Toolkit. O\u2019Reilly, Beijing (2009)"},{"issue":"1","key":"53_CR9","doi-asserted-by":"crossref","first-page":"61","DOI":"10.14257\/ijdta.2014.7.1.06","volume":"7","author":"V Bijalwan","year":"2014","unstructured":"Bijalwan, V., et al.: KNN based machine learning approach for text and document mining. Int. J. Database Theo. Appl. 7(1), 61\u201370 (2014)","journal-title":"Int. J. Database Theo. Appl."},{"issue":"9","key":"53_CR10","doi-asserted-by":"crossref","first-page":"1264","DOI":"10.1109\/TKDE.2008.76","volume":"20","author":"D Isa","year":"2008","unstructured":"Isa, D., et al.: Text document preprocessing with the Bayes formula for classification using the support vector machine. IEEE Trans. Knowl. Data Eng. 20(9), 1264\u20131272 (2008)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"53_CR11","doi-asserted-by":"crossref","unstructured":"Wang, L., Zhao, X.: Improved KNN classification algorithms research in text categorization. In: 2nd International Conference Consumer Electronics, Communications and Networks (CECNet), IEEE (2012)","DOI":"10.1109\/CECNet.2012.6201850"},{"key":"53_CR12","unstructured":"Perkins, J.: Python 3 Text Processing with NLTK 3 Cookbook. Packt Publishing (2014)"},{"key":"53_CR13","unstructured":"Dean, J., Ghemawat, S.: MapReduce: simplified data processing on large clusters. In: OSDI 2004 Sixth Symposium on Operating System Design and Implementation (2004)"},{"key":"53_CR14","unstructured":"Rosnova, D.: Practical Natural Language Processing with Hadoop. https:\/\/danrosanova.files.wordpress.com\/2014\/04\/practical-natural-language-processing-with-hadoop.pdf"},{"key":"53_CR15","doi-asserted-by":"crossref","unstructured":"Shvachko, K., Kuang, H., Radia, S., Chansler, R.: The Hadoop Distributed File System. Yahoo!, Sunnyvale, California USA (2010)","DOI":"10.1109\/MSST.2010.5496972"},{"key":"53_CR16","doi-asserted-by":"crossref","unstructured":"Zaharia, M., Das, T., Li, H., Hunter, T., Shenker, S., Stoica, I.: Discretized streams: fault-tolerant streaming computation at scale. In: Twenty-Fourth ACM Symposium on Operating Systems Principles, pp. 423\u2013438. ACM New York (2013)","DOI":"10.1145\/2517349.2522737"},{"key":"53_CR17","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1007\/978-3-319-07983-7_1","volume-title":"Natural Language Processing and Information Systems","author":"T Smedt De","year":"2014","unstructured":"De Smedt, T., Marfia, F., Matteucci, M., Daelemans, W.: Using wiktionary to build an italian part-of-speech tagger. In: M\u00e9tais, E., Roche, M., Teisseire, M. (eds.) NLDB 2014. LNCS, vol. 8455, pp. 1\u20138. Springer, Heidelberg (2014)"}],"container-title":["Lecture Notes in Computer Science","Artificial Intelligence and Soft Computing"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-39378-0_53","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,6,24]],"date-time":"2017-06-24T15:16:59Z","timestamp":1498317419000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-319-39378-0_53"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016]]},"ISBN":["9783319393773","9783319393780"],"references-count":17,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-39378-0_53","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2016]]}}}