{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,21]],"date-time":"2026-04-21T08:32:47Z","timestamp":1776760367972,"version":"3.51.2"},"reference-count":87,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2019,4,8]],"date-time":"2019-04-08T00:00:00Z","timestamp":1554681600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Lang Resources &amp; Evaluation"],"published-print":{"date-parts":[[2019,12]]},"DOI":"10.1007\/s10579-019-09456-6","type":"journal-article","created":{"date-parts":[[2019,4,9]],"date-time":"2019-04-09T03:21:56Z","timestamp":1554780116000},"page":"707-733","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["Beyond lexical frequencies: using R for text analysis in the digital humanities"],"prefix":"10.1007","volume":"53","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0576-0669","authenticated-orcid":false,"given":"Taylor","family":"Arnold","sequence":"first","affiliation":[]},{"given":"Nicolas","family":"Ballier","sequence":"additional","affiliation":[]},{"given":"Paula","family":"Liss\u00f3n","sequence":"additional","affiliation":[]},{"given":"Lauren","family":"Tilton","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,4,8]]},"reference":[{"key":"9456_CR1","unstructured":"Allaire, J., Cheng, J., Xie, Y., McPherson, J., Chang, W., Allen, J., Wickham, H., Atkins, A., Hyndman, R., & Arslan, R. (2017). rmarkdown: Dynamic documents for R. R package version 1.6. https:\/\/cran.r-project.org\/package=rmarkdown ."},{"key":"9456_CR2","unstructured":"Anthony, L. (2004). Antconc: A learner and classroom friendly, multi-platform corpus analysis toolkit. In Proceedings of IWLeL (pp. 7\u201313)."},{"issue":"2","key":"9456_CR3","doi-asserted-by":"crossref","first-page":"141","DOI":"10.17250\/khisli.30.2.201308.001","volume":"30","author":"L Anthony","year":"2013","unstructured":"Anthony, L. (2013). A critical look at software tools in corpus linguistics. Linguistic Research, 30(2), 141\u2013161.","journal-title":"Linguistic Research"},{"key":"9456_CR4","unstructured":"Arnold, T., & Benoit, K. (2017). tif: Text interchange format. R package version 0.2. https:\/\/github.com\/ropensci\/tif\/ ."},{"key":"9456_CR5","unstructured":"Arnold, T., Liss\u00f3n, P., & Ballier, N. (2017). fasttextM: Work with bilingual word embeddings. R package version 0.0.1. https:\/\/github.com\/statsmaths\/fasttextM\/ ."},{"issue":"2","key":"9456_CR6","doi-asserted-by":"crossref","first-page":"1","DOI":"10.32614\/RJ-2017-035","volume":"9","author":"T Arnold","year":"2017","unstructured":"Arnold, T. (2017). A tidy data model for natural language processing using cleannlp. The R Journal, 9(2), 1\u201320.","journal-title":"The R Journal"},{"key":"9456_CR7","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-319-20702-5","volume-title":"Humanities data in R","author":"T Arnold","year":"2015","unstructured":"Arnold, T., & Tilton, L. (2015). Humanities data in R. New York: Springer."},{"key":"9456_CR8","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511801686","volume-title":"Analyzing linguistic data: A practical introduction to statistics using R","author":"RH Baayen","year":"2008","unstructured":"Baayen, R. H. (2008). Analyzing linguistic data: A practical introduction to statistics using R. Cambridge: Cambridge University Press."},{"key":"9456_CR9","unstructured":"Baglama, J., Reichel, L., & Lewis, B. W. (2017). irlba: Fast truncated singular value decomposition and principal components analysis for large dense and sparse matrices. R package version 2.2.1. https:\/\/cran.r-project.org\/package=irlba ."},{"key":"9456_CR10","unstructured":"Ballier, N., & Liss\u00f3n, P. (2017). R-based strategies for DH in English Linguistics: A case study. In Bockwinkel, P., Declerck, T., K\u00fcbler, S., Zinsmeister, H. (eds), Proceedings of the Workshop on Teaching NLP for Digital Humanities, CEUR Workshop Proceedings, Berlin, Germany (Vol. 1918, pp. 1\u201310). http:\/\/ceur-ws.org\/Vol-1918\/ballier.pdf ."},{"key":"9456_CR11","volume-title":"Donn\u00e9es, M\u00e9tadonn\u00e9es des corpus et catalogage des objets en sciences humaines et sociales","author":"N Ballier","year":"2016","unstructured":"Ballier, N. (2016). R, pour un \u00e9cosyst\u00e8me du traitement des donn\u00e9es? L\u2019exemple de la linguistique. In P. Caron (Ed.), Donn\u00e9es, M\u00e9tadonn\u00e9es des corpus et catalogage des objets en sciences humaines et sociales. Rennes: Presses universitaires de Rennes."},{"key":"9456_CR12","doi-asserted-by":"crossref","first-page":"361","DOI":"10.1609\/icwsm.v3i1.13937","volume":"8","author":"M Bastian","year":"2009","unstructured":"Bastian, M., Heymann, S., Jacomy, M., et al. (2009). Gephi: An open source software for exploring and manipulating networks. International Conference on Web and Social Media, 8, 361\u2013362.","journal-title":"International Conference on Web and Social Media"},{"key":"9456_CR13","volume-title":"S: An interactive environment for data analysis and graphics","author":"RA Becker","year":"1984","unstructured":"Becker, R. A., & Chambers, J. M. (1984). S: An interactive environment for data analysis and graphics. Boca Raton: CRC Press."},{"key":"9456_CR14","volume-title":"Analyse textuelle avec R","author":"M B\u00e9cue-Bertaut","year":"2018","unstructured":"B\u00e9cue-Bertaut, M., & Lebart, L. (2018). Analyse textuelle avec R. Rennes: Presses universitaires de Rennes."},{"key":"9456_CR15","unstructured":"Benoit, K., & Matsuo, A. (2017). spacyr: R Wrapper to the spaCy NLP Library. R package version 0.9.0. https:\/\/cran.r-project.org\/package=spacyr ."},{"key":"9456_CR16","unstructured":"Benoit, K., & Obeng, A. (2017). readtext: Import and handling for plain and formatted text files. R package version 0.50. https:\/\/cran.r-project.org\/package=readtext ."},{"key":"9456_CR17","unstructured":"Benoit, K., Watanabe, K., Nulty, P., Obeng, A., Wang, H., Lauderdale, B., & Lowe, W. (2017). Quanteda: Quantitative analysis of textual data. R package version 0.99.9. https:\/\/cran.r-project.org\/package=quanteda ."},{"key":"9456_CR18","first-page":"1","volume":"12","author":"DM Berry","year":"2011","unstructured":"Berry, D. M. (2011). The computational turn: Thinking about the digital humanities. Culture Machine, 12, 1\u201322.","journal-title":"Culture Machine"},{"key":"9456_CR19","doi-asserted-by":"crossref","unstructured":"Bird, S. (2006). NLTK: The natural language toolkit. In Proceedings of the COLING\/ACL on interactive presentation sessions, Association for Computational Linguistics (pp. 69\u201372).","DOI":"10.3115\/1225403.1225421"},{"key":"9456_CR20","unstructured":"Blevins, C., & Mullen, L. (2015). Jane, John ... Leslie? A historical method for algorithmic gender prediction. Digital Humanities Quarterly 9(3)."},{"key":"9456_CR21","unstructured":"Bradley, J., & Rockwell, G. (1992). Towards new research tools in computer-assisted text analysis. In Canadian Learned Societies Conference."},{"issue":"2","key":"9456_CR22","doi-asserted-by":"crossref","first-page":"139","DOI":"10.1075\/ijcl.20.2.01bre","volume":"20","author":"V Brezina","year":"2015","unstructured":"Brezina, V., McEnery, T., & Wattam, S. (2015). Collocations in context: A new perspective on collocation networks. International Journal of Corpus Linguistics, 20(2), 139\u2013173.","journal-title":"International Journal of Corpus Linguistics"},{"issue":"2","key":"9456_CR23","doi-asserted-by":"crossref","first-page":"513","DOI":"10.9788\/TP2013.2-16","volume":"21","author":"BV Camargo","year":"2013","unstructured":"Camargo, B. V., & Justo, A. M. (2013). Iramuteq: um software gratuito para an\u00e1lisede dados textuais. Temas em Psicologia, 21(2), 513\u2013518.","journal-title":"Temas em Psicologia"},{"key":"9456_CR24","unstructured":"Chang, W., Cheng, J., Allaire, J., Xie, Y., & McPherson, J. (2017). shiny: Web application framework for R. R package version 1.0.4. https:\/\/cran.r-project.org\/package=shiny ."},{"key":"9456_CR25","unstructured":"Deschamps, R. (2017). Correspondence analysis for historical research with R. The Programming Historian. https:\/\/programminghistorian.org\/en\/lessons\/correspondence-analysis-in-R ."},{"key":"9456_CR26","unstructured":"Dewar, T. (2016). R basics with tabular data. The Programming Historian. https:\/\/programminghistorian.org\/en\/lessons\/r-basicswith-tabular-data ."},{"key":"9456_CR27","unstructured":"Donaldson, J. (2016). tsne: T-distributed stochastic neighbor embedding for R (t-SNE). R package version 0.1-3. https:\/\/cran.r-project.org\/package=tsne ."},{"issue":"1","key":"9456_CR28","doi-asserted-by":"crossref","first-page":"107","DOI":"10.32614\/RJ-2016-007","volume":"8","author":"M Eder","year":"2016","unstructured":"Eder, M., Rybicki, J., & Kestemont, M. (2016). Stylometry with R: A package for computational text analysis. R Journal, 8(1), 107\u2013121.","journal-title":"R Journal"},{"issue":"5","key":"9456_CR29","doi-asserted-by":"crossref","first-page":"1","DOI":"10.18637\/jss.v025.i05","volume":"25","author":"I Feinerer","year":"2008","unstructured":"Feinerer, I., Hornik, K., & Meyer, D. (2008). Text mining infrastructure in R. Journal of Statistical Software, 25(5), 1\u201354.","journal-title":"Journal of Statistical Software"},{"key":"9456_CR30","unstructured":"Fleury, S., & Zimina, M. (2014). Trameur: A framework for annotated text corpora exploration. In COLING (Demos) (pp. 57\u201361)."},{"key":"9456_CR31","unstructured":"Gagolewski, M. (2017). R package stringi: Character string processing facilities. https:\/\/cran.r-project.org\/package=stringi ."},{"key":"9456_CR32","unstructured":"Gerdes, K. (2014). Corpus collection and analysis for the linguistic layman: The Gromoteur. http:\/\/gromoteur.ilpga.fr\/ ."},{"issue":"3","key":"9456_CR33","doi-asserted-by":"crossref","first-page":"359","DOI":"10.1353\/nlh.2014.0025","volume":"45","author":"A Goldstone","year":"2014","unstructured":"Goldstone, A., & Underwood, T. (2014). The quiet transformations of literary studies: What thirteen thousand scholars could tell us. New Literary History, 45(3), 359\u2013384.","journal-title":"New Literary History"},{"key":"9456_CR34","doi-asserted-by":"crossref","DOI":"10.1515\/9783110216042","volume-title":"Quantitative corpus linguistics with R: A practical introduction","author":"S Gries","year":"2009","unstructured":"Gries, S. (2009). Quantitative corpus linguistics with R: A practical introduction. London: Routledge."},{"key":"9456_CR35","doi-asserted-by":"crossref","DOI":"10.1515\/9783110307474","volume-title":"Statistics for linguistics with R: A practical introduction","author":"S Gries","year":"2013","unstructured":"Gries, S. (2013). Statistics for linguistics with R: A practical introduction. Berlin: Walter de Gruyter."},{"issue":"1","key":"9456_CR36","doi-asserted-by":"crossref","first-page":"109","DOI":"10.3366\/cor.2014.0053","volume":"9","author":"ST Gries","year":"2014","unstructured":"Gries, S. T., & Deshors, S. C. (2014). Using regressions to explore deviations between corpus data and a standard\/target: Two suggestions. Corpora, 9(1), 109\u2013136.","journal-title":"Corpora"},{"key":"9456_CR37","doi-asserted-by":"crossref","first-page":"35","DOI":"10.1075\/scl.51.02gri","volume-title":"Regression analysis in translation studies. Quantitative methods in corpus-based translation studies: A practical guide to descriptive translation research","author":"ST Gries","year":"2012","unstructured":"Gries, S. T., & Wulff, S. (2012). Regression analysis in translation studies. Quantitative methods in corpus-based translation studies: A practical guide to descriptive translation research (pp. 35\u201352). Amsterdam: Benjamins."},{"issue":"13","key":"9456_CR38","doi-asserted-by":"publisher","first-page":"1","DOI":"10.18637\/jss.v040.i13","volume":"40","author":"B Gr\u00fcn","year":"2011","unstructured":"Gr\u00fcn, B., & Hornik, K. (2011). topicmodels: An R package for fitting topic models. Journal of Statistical Software, 40(13), 1\u201330. https:\/\/doi.org\/10.18637\/jss.v040.i13 .","journal-title":"Journal of Statistical Software"},{"key":"9456_CR39","unstructured":"Heiden, S. (2010). The txm platform: Building open-source textual analysis software compatible with the tei encoding scheme. In 24th Pacific Asia conference on language, information and computation, Institute for Digital Enhancement of Cognitive Development, Waseda University (pp. 389\u2013398)."},{"key":"9456_CR40","doi-asserted-by":"crossref","unstructured":"Honnibal, M., & Johnson, M. (2015). An improved non-monotonic transition system for dependency parsing. In Proceedings of the 2015 conference on empirical methods in natural language processing, Association for Computational Linguistics, Lisbon, Portugal (pp. 1373\u20131378).","DOI":"10.18653\/v1\/D15-1162"},{"key":"9456_CR41","unstructured":"Hornik, K. (2016). openNLP: Apache OpenNLP tools interface. R package version 0.2-6. https:\/\/cran.r-project.org\/package=openNLP ."},{"key":"9456_CR42","unstructured":"Hornik, K. (2017a). NLP: Natural language processing infrastructure. R package version 0.1-11. https:\/\/cran.r-project.org\/package=NLP ."},{"key":"9456_CR43","unstructured":"Hornik, K. (2017b). R FAQ. https:\/\/cran.r-project.org\/doc\/FAQ\/R-FAQ.html ."},{"issue":"1","key":"9456_CR44","first-page":"505","volume":"9","author":"K Hornik","year":"2017","unstructured":"Hornik, K., Ligges, U., & Zeileis, A. (2017). Changes on CRAN. The R Journal, 9(1), 505\u2013507.","journal-title":"The R Journal"},{"issue":"3","key":"9456_CR45","first-page":"299","volume":"5","author":"R Ihaka","year":"1996","unstructured":"Ihaka, R., & Gentleman, R. (1996). R: A language for data analysis and graphics. Journal of Computational and Graphical Statistics, 5(3), 299\u2013314.","journal-title":"Journal of Computational and Graphical Statistics"},{"key":"9456_CR46","doi-asserted-by":"crossref","DOI":"10.5406\/illinois\/9780252037528.001.0001","volume-title":"Macroanalysis: Digital methods and literary history","author":"ML Jockers","year":"2013","unstructured":"Jockers, M. L. (2013). Macroanalysis: Digital methods and literary history. Champaign: University of Illinois Press."},{"key":"9456_CR47","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-319-03164-4","volume-title":"Text analysis with R for students of literature","author":"ML Jockers","year":"2014","unstructured":"Jockers, M. L. (2014). Text analysis with R for students of literature. New York: Springer."},{"key":"9456_CR48","volume-title":"Quantitative methods in linguistics","author":"K Johnson","year":"2008","unstructured":"Johnson, K. (2008). Quantitative methods in linguistics. London: Wiley."},{"issue":"1","key":"9456_CR49","doi-asserted-by":"crossref","first-page":"144","DOI":"10.32614\/RJ-2013-014","volume":"5","author":"D Kahle","year":"2013","unstructured":"Kahle, D., & Wickham, H. (2013). ggmap: Spatial visualization with ggplot2. The R Journal, 5(1), 144\u2013161.","journal-title":"The R Journal"},{"issue":"1","key":"9456_CR50","doi-asserted-by":"crossref","first-page":"7","DOI":"10.1007\/s40607-014-0009-9","volume":"1","author":"A Kilgarriff","year":"2014","unstructured":"Kilgarriff, A., Baisa, V., Bu\u0161ta, J., Jakub\u00ed\u010dek, M., Kov\u00e1\u0159, V., Michelfeit, J., et al. (2014). The sketch engine: Ten years on. Lexicography, 1(1), 7\u201336.","journal-title":"Lexicography"},{"issue":"suppl 1","key":"9456_CR51","first-page":"i114","volume":"30","author":"C Klaussner","year":"2015","unstructured":"Klaussner, C., Nerbonne, J., & \u00c7\u00f6ltekin, \u00c7. (2015). Finding characteristic features in stylometric analysis. Digital Scholarship in the Humanities, 30(suppl 1), i114\u2013i129.","journal-title":"Digital Scholarship in the Humanities"},{"key":"9456_CR52","volume-title":"Cesax: Coreference editor for syntactically annotated xml corpora. Reference manual Nijmegen","author":"ER Komen","year":"2011","unstructured":"Komen, E. R. (2011). Cesax: Coreference editor for syntactically annotated xml corpora. Reference manual Nijmegen. Nijmegen: Radboud University Nijmegen."},{"key":"9456_CR53","unstructured":"Lamalle, C., Martinez, W., Fleury, S., Salem, A., Fracchiolla, B., Kuncova, A., & Maisondieu, A. (2003). Lexico3\u2013outils de statistique textuelle. manuel d\u2019utilisation. SYLED\u2013CLA2T, Universit\u00e9 de la Sorbonne nouvelle\u2013Paris 3:48."},{"key":"9456_CR54","volume-title":"Using tact with electronic texts","author":"I Lancashire","year":"1996","unstructured":"Lancashire, I., Bradley, J., McCarty, W., Stairs, M., & Wooldridge, T. (1996). Using tact with electronic texts. New York: MLA."},{"key":"9456_CR55","first-page":"1935","volume-title":"Documenting America","author":"LW Levine","year":"1988","unstructured":"Levine, L. W. (1988). Documenting America (Vol. 2, pp. 1935\u20131943). Berkeley: University of California Press."},{"key":"9456_CR56","doi-asserted-by":"crossref","DOI":"10.1075\/z.195","volume-title":"How to do linguistics with R: Data exploration and statistical analysis","author":"N Levshina","year":"2015","unstructured":"Levshina, N. (2015). How to do linguistics with R: Data exploration and statistical analysis. Amsterdam: John Benjamins Publishing Company."},{"issue":"1","key":"9456_CR57","doi-asserted-by":"crossref","first-page":"28","DOI":"10.1109\/LGRS.2009.2023536","volume":"7","author":"M Lienou","year":"2010","unstructured":"Lienou, M., Maitre, H., & Datcu, M. (2010). Semantic annotation of satellite images using latent dirichlet allocation. IEEE Geoscience and Remote Sensing Letters, 7(1), 28\u201332.","journal-title":"IEEE Geoscience and Remote Sensing Letters"},{"key":"9456_CR58","doi-asserted-by":"crossref","unstructured":"Manning, C. D., Surdeanu, M., Bauer, J., Finkel, J. R., Bethard, S., & McClosky, D. (2014). The stanford corenlp natural language processing toolkit. In ACL (system demonstrations) (pp. 55\u201360).","DOI":"10.3115\/v1\/P14-5010"},{"key":"9456_CR59","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511981395","volume-title":"Corpus linguistics: Method, theory and practice","author":"T McEnery","year":"2011","unstructured":"McEnery, T., & Hardie, A. (2011). Corpus linguistics: Method, theory and practice. Cambridge: Cambridge University Press."},{"key":"9456_CR60","unstructured":"Michalke, M. (2017). koRpus: An R package for text analysis. (Version 0.10-2). https:\/\/cran.rproject.org\/package=koRpus ."},{"key":"9456_CR61","unstructured":"Mimno, D. (2013). mallet: A wrapper around the Java machine learning tool MALLET. R package version 1.0. https:\/\/cran.r-project.org\/package=mallet ."},{"key":"9456_CR62","unstructured":"Morton, T., Kottmann, J., Baldridge, J., & Bierner, G. (2005). Opennlp: A java-based nlp toolkit. In EACL."},{"key":"9456_CR63","unstructured":"O\u2019Donnell, M. (2008). The uam corpustool: Software for corpus annotation and exploration. In Proceedings of the XXvI congreso de AESLA, Almeria, Spain (pp. 3\u20135)."},{"key":"9456_CR64","unstructured":"Ooms, J. (2017). hunspell: High-performance Stemmer, Tokenizer, and spell checker for R. R package version 2.6. https:\/\/cran.r-project.org\/package=hunspell ."},{"issue":"suppl 1","key":"9456_CR65","first-page":"i142","volume":"30","author":"J O\u2019Sullivan","year":"2015","unstructured":"O\u2019Sullivan, J., Jakacki, D., & Galvin, M. (2015). Programming in the digital humanities. Digital Scholarship in the Humanities, 30(suppl 1), i142\u2013i147.","journal-title":"Digital Scholarship in the Humanities"},{"issue":"6060","key":"9456_CR66","doi-asserted-by":"crossref","first-page":"1226","DOI":"10.1126\/science.1213847","volume":"334","author":"RD Peng","year":"2011","unstructured":"Peng, R. D. (2011). Reproducible research in computational science. Science, 334(6060), 1226\u20131227.","journal-title":"Science"},{"key":"9456_CR67","unstructured":"Rayson, P. (2009). Wmatrix: A web-based corpus processing environment. http:\/\/ucrel.lancs.ac.uk\/wmatrix\/ ."},{"key":"9456_CR68","volume-title":"qdap: Quantitative discourse analysis package","author":"TW Rinker","year":"2013","unstructured":"Rinker, T. W. (2013). qdap: Quantitative discourse analysis package. Buffalo, NY: University at Buffalo\/SUNY. 2.2.8."},{"key":"9456_CR69","volume-title":"RStudio: Integrated development environment for R","author":"RStudio Team","year":"2017","unstructured":"RStudio Team. (2017). RStudio: Integrated development environment for R. Boston, MA: RStudio Inc."},{"key":"9456_CR70","unstructured":"Rudis, B., Levien, R., Engelhard, R., Halls, C., Novodvorsky, P., N\u00e9meth, L., & Buitenhuis, N. (2016). hyphenatr: Tools to Hyphenate Strings Using the \u2019Hunspell\u2019 Hyphenation Library. R package version 0.3.0. https:\/\/cran.r-project.org\/package=hyphenatr ."},{"key":"9456_CR71","first-page":"4","volume":"9","author":"R Salkie","year":"1995","unstructured":"Salkie, R. (1995). Intersect: A parallel corpus project at brighton university. Computers and Texts, 9, 4\u20135.","journal-title":"Computers and Texts"},{"key":"9456_CR72","doi-asserted-by":"crossref","DOI":"10.1002\/9781118680605","volume-title":"A new companion to digital humanities","author":"S Schreibman","year":"2015","unstructured":"Schreibman, S., Siemens, R., & Unsworth, J. (2015). A new companion to digital humanities. London: Wiley."},{"key":"9456_CR73","unstructured":"Scott, M. (1996). WordSmith tools, Stroud: Lexical analysis software. https:\/\/lexically.net\/wordsmith\/ ."},{"key":"9456_CR74","unstructured":"Siddiqui, N. (2017). Data wrangling and management in R. The Programming Historian. https:\/\/programminghistorian.org\/en\/lessons\/data_wrangling_and_management_in_R ."},{"key":"9456_CR75","unstructured":"Sievert, C., & Shirley, K. (2015). LDAtools: Tools to fit a topic model using Latent Dirichlet Allocation (LDA). R package version 0.1. https:\/\/cran.r-project.org\/package=LDAtools ."},{"issue":"5","key":"9456_CR76","doi-asserted-by":"crossref","first-page":"1","DOI":"10.18637\/jss.v039.i05","volume":"39","author":"N Simon","year":"2011","unstructured":"Simon, N., Friedman, J., Hastie, T., & Tibshirani, R. (2011). Regularization paths for cox\u2019s proportional hazards model via coordinate descent. Journal of Statistical Software, 39(5), 1\u201313.","journal-title":"Journal of Statistical Software"},{"key":"9456_CR77","unstructured":"Sinclair, S., Rockwell, G., et al. (2016). Voyant tools. http:\/\/voyant-tools.org\/ . Accessed 4 Sept 2018."},{"issue":"1","key":"9456_CR78","doi-asserted-by":"crossref","first-page":"59","DOI":"10.3366\/E1749503208000075","volume":"3","author":"S Th Gries","year":"2008","unstructured":"Th Gries, S., & Hilpert, M. (2008). The identification of stages in diachronic data: Variability-based neighbour clustering. Corpora, 3(1), 59\u201381.","journal-title":"Corpora"},{"key":"9456_CR79","unstructured":"Underwood, T. (2017). A genealogy of distant reading. Digital Humanities Quarterly. http:\/\/digitalhumanities.org\/dhq\/vol\/11\/2\/000317\/000317.html ."},{"key":"9456_CR80","unstructured":"Ushey, K., McPherson, J., Cheng, J., Atkins, A., & Allaire, J. (2016). packrat: A dependency management system for projects and their R package dependencies. R package version 0.4.8-1. https:\/\/cran.r-project.org\/package=packrat ."},{"key":"9456_CR81","unstructured":"Wang, X., & Grimson, E. (2008). Spatial latent Dirichlet Allocation. In: Advances in neural information processing systems 20 (pp. 1577\u20131584). Curran Associates, Inc. http:\/\/papers.nips.cc\/paper\/3278-spatial-latent-dirichlet-allocation.pdf ."},{"issue":"4","key":"9456_CR82","doi-asserted-by":"crossref","first-page":"245","DOI":"10.1080\/19312458.2017.1387238","volume":"11","author":"K Welbers","year":"2017","unstructured":"Welbers, K., Van Atteveldt, W., & Benoit, K. (2017). Text analysis in R. Communication Methods and Measures, 11(4), 245\u2013265.","journal-title":"Communication Methods and Measures"},{"key":"9456_CR83","unstructured":"Wiedemann, G., & Niekler, A. (2017). Hands-on: A five day text mining course for humanists and social scientists in R. In Proceedings of the 1st workshop teaching NLP for digital humanities."},{"key":"9456_CR84","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-658-15309-0","volume-title":"Text mining for qualitative data analysis in the social sciences","author":"G Wiedemann","year":"2016","unstructured":"Wiedemann, G. (2016). Text mining for qualitative data analysis in the social sciences. New York: Springer."},{"key":"9456_CR85","unstructured":"Wijffels, J. (2018). udpipe: Tokenization, parts of speech tagging, lemmatization and dependency parsing with the \u2019UDPipe\u2019 \u2019NLP\u2019 Toolkit. R package version 0.6.1. https:\/\/cran.r-project.org\/package=udpipe ."},{"issue":"1\u20133","key":"9456_CR86","doi-asserted-by":"crossref","first-page":"37","DOI":"10.1016\/0169-7439(87)80084-9","volume":"2","author":"S Wold","year":"1987","unstructured":"Wold, S., Esbensen, K., & Geladi, P. (1987). Principal component analysis. Chemometrics and Intelligent Laboratory Systems, 2(1\u20133), 37\u201352.","journal-title":"Chemometrics and Intelligent Laboratory Systems"},{"key":"9456_CR87","unstructured":"Xie, Y. (2014). knitr: A comprehensive tool for reproducible research in R. In: Stodden, V., Leisch, F., & Peng, R. D. (eds), Implementing reproducible computational research. Chapman and Hall\/CRC. ISBN: 978-1466561595."}],"container-title":["Language Resources and Evaluation"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-019-09456-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10579-019-09456-6\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10579-019-09456-6.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,9,15]],"date-time":"2023-09-15T14:31:22Z","timestamp":1694788282000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10579-019-09456-6"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,4,8]]},"references-count":87,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2019,12]]}},"alternative-id":["9456"],"URL":"https:\/\/doi.org\/10.1007\/s10579-019-09456-6","relation":{},"ISSN":["1574-020X","1574-0218"],"issn-type":[{"value":"1574-020X","type":"print"},{"value":"1574-0218","type":"electronic"}],"subject":[],"published":{"date-parts":[[2019,4,8]]},"assertion":[{"value":"8 April 2019","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}