{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,14]],"date-time":"2026-02-14T05:45:16Z","timestamp":1771047916454,"version":"3.50.1"},"reference-count":17,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2018,8,4]],"date-time":"2018-08-04T00:00:00Z","timestamp":1533340800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Grid Computing"],"published-print":{"date-parts":[[2019,6]]},"DOI":"10.1007\/s10723-018-9452-4","type":"journal-article","created":{"date-parts":[[2018,8,4]],"date-time":"2018-08-04T01:59:12Z","timestamp":1533347952000},"page":"357-366","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Big Data Analytics, Text Mining and Modern English Language"],"prefix":"10.1007","volume":"17","author":[{"given":"Saqib","family":"Alam","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nianmin","family":"Yao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2018,8,4]]},"reference":[{"key":"9452_CR1","doi-asserted-by":"crossref","unstructured":"Chou, S., Hsing, T.P.: Text mining technique for Chinese written judgment of criminal case. In: Pacific-Asia workshop on intelligence and security informatics, pp 113\u2013125. Springer, Berlin (2010)","DOI":"10.1007\/978-3-642-13601-6_14"},{"issue":"3","key":"9452_CR2","doi-asserted-by":"publisher","first-page":"441","DOI":"10.1080\/15326900701326576","volume":"31","author":"TL Griffiths","year":"2007","unstructured":"Griffiths, T.L., Kalish, M.L.: Language evolution by iterated learning with Bayesian agents. Cogn. Sci. 31(3), 441\u2013480 (2007)","journal-title":"Cogn. Sci."},{"key":"9452_CR3","unstructured":"Reed, J.W., Jiao, Y., Potok, T.E., Klump, B.A., Elmore, M.T., Hurson, A.R.: TF-ICF: A new term weighting scheme for clustering dynamic data streams. In: 5th international conference on machine learning and applications, 2006. ICMLA\u201906. (pp. 258-263). IEEE (2006)"},{"key":"9452_CR4","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1016\/j.cognition.2015.06.009","volume":"143","author":"TT Hills","year":"2015","unstructured":"Hills, T.T., Adelman, J.S.: Recent evolution of learnability in American English from 1800 to 2000. Cognition 143, 87\u201392 (2015)","journal-title":"Cognition"},{"key":"9452_CR5","unstructured":"Ramos, J.: Using tf-idf to determine word relevance in document queries. In: Proceedings of the first instructional conference on machine learning, vol. 242, pp. 133\u2013142 (2003)"},{"issue":"1","key":"9452_CR6","doi-asserted-by":"publisher","first-page":"171545","DOI":"10.1098\/rsos.171545","volume":"5","author":"L Dias","year":"2018","unstructured":"Dias, L., Gerlach, M., Scharloth, J., Altmann, E.G.: Using text analysis to quantify the similarity and evolution of scientific disciplines. R. Soc. Open Sci. 5(1), 171545 (2018)","journal-title":"R. Soc. Open Sci."},{"key":"9452_CR7","volume-title":"English and general historical lexicology","author":"J Grzega","year":"2007","unstructured":"Grzega, J., Schoener, M.: English and general historical lexicology. Eichst\u00e4tt-Ingolstadt, Katholische Universit\u00e4t (2007)"},{"key":"9452_CR8","unstructured":"Firbas, J.A.N.: De Vordre des mots dans les langues anciennes com- pares aux langues modernes Question de grammaire generate (1844)"},{"issue":"1","key":"9452_CR9","doi-asserted-by":"publisher","first-page":"30","DOI":"10.1109\/TKDE.2010.211","volume":"24","author":"N Zhong","year":"2012","unstructured":"Zhong, N., Li, Y., Wu, S.T.: Effective pattern discovery for text mining. IEEE Trans. Knowl. Data Eng. 24(1), 30\u201344 (2012)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"9452_CR10","doi-asserted-by":"crossref","unstructured":"Munkov\u00e1, D., Munk, M., Voz\u00e1r, M.: Influence of stop-words removal on sequence patterns identification within comparable corpora. In: ICT innovations 2013, pp 67\u201376. Springer, Heidelberg (2014)","DOI":"10.1007\/978-3-319-01466-1_6"},{"issue":"8","key":"9452_CR11","doi-asserted-by":"publisher","first-page":"e68178","DOI":"10.1371\/journal.pone.0068178","volume":"8","author":"Z Rehman","year":"2013","unstructured":"Rehman, Z., Anwar, W., Bajwa, U.I., Xuan, W., Chaoying, Z.: Morpheme matching based text tokenization for a scarce resourced language. PloS one 8(8), e68178 (2013)","journal-title":"PloS one"},{"key":"9452_CR12","doi-asserted-by":"crossref","unstructured":"Blumenstock, J.E.: Size matters: word count as a measure of quality on wikipedia. In: Proceedings of the 17th international conference on World Wide Web (pp. 1095\u20131096). ACM (2008)","DOI":"10.1145\/1367497.1367673"},{"issue":"5","key":"9452_CR13","doi-asserted-by":"publisher","first-page":"503","DOI":"10.1108\/00220410410560582","volume":"60","author":"S Robertson","year":"2004","unstructured":"Robertson, S.: Understanding inverse document frequency: on theoretical arguments for IDF. J. Doc. 60(5), 503\u2013520 (2004)","journal-title":"J. Doc."},{"issue":"5","key":"9452_CR14","doi-asserted-by":"publisher","first-page":"4760","DOI":"10.1016\/j.eswa.2011.09.160","volume":"39","author":"N Azam","year":"2012","unstructured":"Azam, N., Yao, J.: Comparison of term frequency and document frequency based feature selection metrics in text categorization. Expert Syst. Appl. 39(5), 4760\u20134768 (2012)","journal-title":"Expert Syst. Appl."},{"key":"9452_CR15","volume-title":"Beautiful evidence, vol. 1","author":"ER Tufte","year":"2006","unstructured":"Tufte, E.R.: Beautiful evidence, vol. 1. Graphics Press, Cheshire (2006)"},{"key":"9452_CR16","doi-asserted-by":"crossref","unstructured":"Hofmann, T.: August. Probabilistic latent semantic indexing. In: ACM SIGIR Forum (Vol. 51, No. 2, pp. 211-218). ACM (2017)","DOI":"10.1145\/3130348.3130370"},{"key":"9452_CR17","doi-asserted-by":"crossref","unstructured":"Zhai, C., Lafferty, J.: A study of smoothing methods for language models applied to ad hoc information retrieval. In: ACM SIGIR Forum (Vol. 51, No. 2, pp. 268-276). ACM (2017)","DOI":"10.1145\/3130348.3130377"}],"container-title":["Journal of Grid Computing"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10723-018-9452-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10723-018-9452-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10723-018-9452-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,8,3]],"date-time":"2019-08-03T19:05:10Z","timestamp":1564859110000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10723-018-9452-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,8,4]]},"references-count":17,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2019,6]]}},"alternative-id":["9452"],"URL":"https:\/\/doi.org\/10.1007\/s10723-018-9452-4","relation":{},"ISSN":["1570-7873","1572-9184"],"issn-type":[{"value":"1570-7873","type":"print"},{"value":"1572-9184","type":"electronic"}],"subject":[],"published":{"date-parts":[[2018,8,4]]},"assertion":[{"value":"20 March 2018","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 July 2018","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 August 2018","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}