{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,20]],"date-time":"2025-12-20T22:20:40Z","timestamp":1766269240943},"reference-count":64,"publisher":"Oxford University Press (OUP)","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Digital Scholarship Humanities"],"DOI":"10.1093\/llc\/fqv037","type":"journal-article","created":{"date-parts":[[2015,9,3]],"date-time":"2015-09-03T02:14:02Z","timestamp":1441246442000},"page":"fqv037","source":"Crossref","is-referenced-by-count":25,"title":["The Impact of Lacking Metadata for the Measurement of Cultural and Linguistic Change Using the Google Ngram Data Sets\u2014Reconstructing the Composition of the German Corpus in Times of WWII"],"prefix":"10.1093","author":[{"given":"Alexander","family":"Koplenig","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"286","published-online":{"date-parts":[[2015,9,2]]},"reference":[{"key":"2015090219135172000_fqv037v1.1","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0059030"},{"key":"2015090219135172000_fqv037v1.2","volume-title":"Uncharted: Big Data as a Lens on Human Culture","author":"Aiden","year":"2013"},{"key":"2015090219135172000_fqv037v1.3","doi-asserted-by":"crossref","first-page":"777","DOI":"10.1515\/9783110213881.2.777","article-title":"Statistical methods for corpus exploitation","volume-title":"Corpus Linguistics: An International Handbook","author":"Baroni","year":"2009"},{"key":"2015090219135172000_fqv037v1.4","volume-title":"Introduction to Time Series Using Stata","author":"Becketti","year":"2013"},{"key":"2015090219135172000_fqv037v1.5","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0083147"},{"key":"2015090219135172000_fqv037v1.6","volume-title":"Die letzte Bonaparte: Freuds Prinzessin : ein Leben","author":"Bertin","year":"1989"},{"key":"2015090219135172000_fqv037v1.7","volume-title":"Variation across Speech and Writing","author":"Biber","year":"1991"},{"key":"2015090219135172000_fqv037v1.8","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511804489","volume-title":"Corpus Linguistics: Investigating Language Structure and Use","author":"Biber","year":"1998"},{"key":"2015090219135172000_fqv037v1.9","doi-asserted-by":"crossref","first-page":"9","DOI":"10.1515\/cllt-2012-0002","article-title":"Register as a predictor of linguistic variation","volume":"8","author":"Biber","year":"2012","journal-title":"Corpus Linguistics and Linguistic Theory"},{"key":"2015090219135172000_fqv037v1.10","unstructured":"Biber D. Gray B. (2013). Being specific about historical change : the influence of sub-register. Journal of English Linguistics [Online]. http:\/\/eng.sagepub.com\/cgi\/doi\/10.1177\/0075424212472509 (accessed 14 April 2014)."},{"key":"2015090219135172000_fqv037v1.11","unstructured":"Blume D. Z\u00fcndorf I. (2014). Biografie Theodor Blank, in: LeMO-Biografien, Lebendiges Museum Online [Online]. http:\/\/www.hdg.de\/lemo\/biografie\/theodor-blank.html (accessed 15 May 2014)."},{"key":"2015090219135172000_fqv037v1.12","unstructured":"Bochkarev V. Solovyev V. Wichmann S. (2014). Universals versus Historical Contingencies in Lexical Evolution. [Online]. http:\/\/wwwstaff.eva.mpg.de\/%7Ewichmann\/LexEvolUploaded.pdf (accessed 12 June 2014)."},{"key":"2015090219135172000_fqv037v1.13","doi-asserted-by":"publisher","DOI":"10.1075\/ijcl.19.1.01bre"},{"key":"2015090219135172000_fqv037v1.14","doi-asserted-by":"publisher","DOI":"10.1177\/0022343313507302"},{"key":"2015090219135172000_fqv037v1.15","unstructured":"Culturomics (2014). Www.culturomics.org [Online]. http:\/\/www.culturomics.org\/ (accessed 8 September 2014)."},{"key":"2015090219135172000_fqv037v1.16","unstructured":"documentArchiv (2014). documentArchiv.de - Wehrgesetz (21.05.1935) [Online]. http:\/\/www.documentarchiv.de\/ns\/1935\/wehrgesetz.html (accessed 15 May 2014)."},{"key":"2015090219135172000_fqv037v1.17","doi-asserted-by":"publisher","DOI":"10.1093\/llc\/12.1.15"},{"key":"2015090219135172000_fqv037v1.18","doi-asserted-by":"publisher","DOI":"10.1093\/hwj\/dbn013"},{"key":"2015090219135172000_fqv037v1.19","unstructured":"Fr\u00fchwald J. (2012). Don\u2019t worry, I\u2019m a physicist. Val Systems [Online]. http:\/\/val-systems.blogspot.de\/2012\/07\/dont-worry-im-physicist.html (accessed 10 March 2014)."},{"key":"2015090219135172000_fqv037v1.20","doi-asserted-by":"publisher","DOI":"10.1098\/rsif.2011.0846"},{"key":"2015090219135172000_fqv037v1.21","doi-asserted-by":"crossref","unstructured":"Gerlach M. Altmann E. G. (2013). Stochastic model for the vocabulary growth in natural languages. Physical Review X [Online] 3. http:\/\/link.aps.org\/doi\/10.1103\/PhysRevX.3.021006 (accessed 12 June 2014).","DOI":"10.1103\/PhysRevX.3.021006"},{"key":"2015090219135172000_fqv037v1.22","doi-asserted-by":"publisher","DOI":"10.1093\/llc\/fqs054"},{"key":"2015090219135172000_fqv037v1.23","unstructured":"Google Inc . (2014). Google Ngram Viewer (datasets] [Online]. https:\/\/books.google.com\/ngrams (accessed 10 March 2014)."},{"key":"2015090219135172000_fqv037v1.24","unstructured":"Google Inc . (2015a). Google Ngram Viewer [Online]. https:\/\/books.google.com\/ngrams\/ (accessed 29 January 2015)."},{"key":"2015090219135172000_fqv037v1.25","unstructured":"Google Inc . (2015b). Library Partners \u2013 Google Books [Online]. http:\/\/www.google.com\/googlebooks\/library\/partners.html (accessed 29 January 2015)."},{"key":"2015090219135172000_fqv037v1.26","doi-asserted-by":"publisher","DOI":"10.1075\/ijcl.13.4.02gri"},{"key":"2015090219135172000_fqv037v1.27","unstructured":"Gulordava K. Baroni M. (2011). A distributional similarity approach to the detection of semantic change in the Google Books Ngram corpus. In: Proceedings of the GEMS 2011 Workshop on GEometrical Models of Natural Language Semantics Edinburgh, Scotland: Association for Computational Linguistics, pp. 67\u201371."},{"key":"2015090219135172000_fqv037v1.28","doi-asserted-by":"publisher","DOI":"10.1093\/llc\/fqn012"},{"key":"2015090219135172000_fqv037v1.29","doi-asserted-by":"publisher","DOI":"10.1093\/llc\/fqt015"},{"key":"2015090219135172000_fqv037v1.30","doi-asserted-by":"crossref","DOI":"10.1142\/8402","volume-title":"A Focus of Discoveries","author":"Huebener","year":"2012"},{"key":"2015090219135172000_fqv037v1.31","doi-asserted-by":"crossref","DOI":"10.5406\/illinois\/9780252037528.001.0001","volume-title":"Macroanalysis: Digital Methods and Literary History. Topics in the Digital Humanities","author":"Jockers","year":"2013"},{"key":"2015090219135172000_fqv037v1.32","unstructured":"Jockers M. L. (2010). Unigrams, and Bigrams, and Trigrams, Oh My [Online]. http:\/\/www.matthewjockers.net\/2010\/12\/22\/unigrams-and-bigrams-and-trigrams-oh-my\/ (accessed 10 March 2014)."},{"key":"2015090219135172000_fqv037v1.33","first-page":"33","article-title":"Some Aspects of the Development of Corpus Linguistics in the 1970s and 1980s","volume-title":"Corpus Linguistics: An International Handbook","author":"Johansson","year":"2009"},{"key":"2015090219135172000_fqv037v1.34","doi-asserted-by":"publisher","DOI":"10.1093\/llc\/fqt017"},{"key":"2015090219135172000_fqv037v1.35","volume-title":"Speech and Language Processing: An Introduction to Natural Language Processing, Computational Linguistics, and Speech Recognition","author":"Jurafsky","year":"2009"},{"key":"2015090219135172000_fqv037v1.36","doi-asserted-by":"publisher","DOI":"10.1080\/17439760.2012.715182"},{"key":"2015090219135172000_fqv037v1.37","unstructured":"Kestemont M. Karsdorp F. D\u00fcring M. (2014). Mining the Twentieth Century\u2019s History from the Time Magazine Corpus. In: Proceedings of LaTeCH 2014 \u2013 The 8th Workshop on Language Technology for Cultural Heritage, Social Sciences, and Humanities, Co-Located with EACL 2014 \u2013 the 14th Conference of the European Chapter of the Association for Computational Linguistics Gothenburg, Sweden, pp. 62\u201370."},{"key":"2015090219135172000_fqv037v1.38","doi-asserted-by":"publisher","DOI":"10.1075\/ijcl.6.1.05kil"},{"key":"2015090219135172000_fqv037v1.39","author":"Koplenig","year":""},{"key":"2015090219135172000_fqv037v1.40","unstructured":"Koplenig A. (2015). Using the parameters of the Zipf\u2013Mandelbrot law to measure diachronic lexical, syntactical and stylistic changes \u2013 a large-scale corpus analysis. Corpus Linguistics and Linguistic Theory [Online] 0. http:\/\/www.degruyter.com\/view\/j\/cllt.ahead-of-print\/cllt-2014\u20100049\/cllt-2014\u20100049.xml (accessed 19 April 2015)."},{"key":"2015090219135172000_fqv037v1.41","first-page":"37","article-title":"Genres, registers, text types, domains, and styles: clarifying the concepts and navigating a path through the BNC jungle","volume":"5","author":"Lee","year":"2001","journal-title":"Language Learning and Technology"},{"key":"2015090219135172000_fqv037v1.42","unstructured":"Liberman M. (2012a). Textual narcissism. Language Log [Online]. http:\/\/languagelog.ldc.upenn.edu\/nll\/?p=4069 (accessed 10 March 2014)."},{"key":"2015090219135172000_fqv037v1.43","unstructured":"Liberman M. (2012b). Textual narcissism, replication 2. Language Log [Online]. http:\/\/languagelog.ldc.upenn.edu\/nll\/?p=4071 (accessed 10 March 2014)."},{"key":"2015090219135172000_fqv037v1.44","unstructured":"Liberman M. (2013). Word String frequency distributions. Language Log [Online]. http:\/\/languagelog.ldc.upenn.edu\/nll\/?p=4456 (accessed 10 March 2014)."},{"key":"2015090219135172000_fqv037v1.45","doi-asserted-by":"crossref","unstructured":"Lijffijt J. Nevalainen T. S\u00e4ily T. Papapetrou P. (2014). Significance testing of word frequencies in corpora. Digital Scholarship in the Humanities [Online]. http:\/\/dsh.oxfordjournals.org\/cgi\/doi\/10.1093\/llc\/fqu064 (accessed 22 April 2015).","DOI":"10.1093\/llc\/fqu064"},{"key":"2015090219135172000_fqv037v1.46","article-title":"CEECing the baseline: Lexical stability and significant change in a historical corpus - Jefrey Lijffijt, Tanja S\u00e4ily & Terttu Nevalainen","volume-title":"Outposts of Historical Corpus Linguistics: From the Helsinki Corpus to a Proliferation of Resources","author":"Lijffijt","year":"2012"},{"key":"2015090219135172000_fqv037v1.47","unstructured":"Lin Y. Michel J.-B. Aiden L. E. (2012). Syntactic Annotations for the Google Books Ngram Corpus. In: Proceedings of the 50th Annual Meeting of the Association for Computational Linguistics Jeju, Republic of Korea, pp. 169\u201374."},{"key":"2015090219135172000_fqv037v1.48","doi-asserted-by":"crossref","first-page":"176","DOI":"10.1126\/science.1199644","article-title":"Quantitative analysis of culture using millions of Digitized Books","volume":"331","author":"Michel","year":"2010","journal-title":"Science"},{"key":"2015090219135172000_fqv037v1.49","unstructured":"Michel J.-B. Shen Y. K. Aiden A. P. (2010a). Quantitative analysis of culture using millions of Digitized Books (Supporting Online Material). Science [Online] 331. http:\/\/www.sciencemag.org\/content\/early\/2010\/12\/15\/science.1199644\/suppl\/DC1 (accessed 5 March 2014)."},{"key":"2015090219135172000_fqv037v1.50","doi-asserted-by":"crossref","unstructured":"Michel J.-B. Shen Y. K. Aiden A .P. (2010b). Quantitative analysis of culture using millions of Digitized Books (Supporting Online Material II). Science [Online] 331. http:\/\/www.sciencemag.org\/content\/331\/6014\/176\/suppl\/DC1 (accessed 5 March 2014).","DOI":"10.1126\/science.1199644"},{"key":"2015090219135172000_fqv037v1.51","first-page":"37","article-title":"English historical corpora in transition: from new tools to legacy corpora?","volume-title":"New Methods in Historical Corpora","author":"Nevalainen","year":"2013"},{"key":"2015090219135172000_fqv037v1.52","doi-asserted-by":"crossref","unstructured":"Pechenick E. A. Danforth C. M. Dodds P. S. (2015). Characterizing the Google Books corpus: strong limits to inferences of socio-cultural and linguistic evolution. [Online]. http:\/\/arxiv.org\/abs\/1501.00960.","DOI":"10.1371\/journal.pone.0137041"},{"key":"2015090219135172000_fqv037v1.53","doi-asserted-by":"publisher","DOI":"10.1098\/rsif.2012.0491"},{"key":"2015090219135172000_fqv037v1.54","doi-asserted-by":"crossref","unstructured":"Petersen A. M. Tenenbaum J. N. Havlin S. (2012a). Languages cool as they expand: Allometric scaling and the decreasing need for new words. Scientific Reports [Online] 2. http:\/\/www.nature.com\/doifinder\/10.1038\/srep00943 (accessed 10 March 2014).","DOI":"10.1038\/srep00943"},{"key":"2015090219135172000_fqv037v1.55","doi-asserted-by":"crossref","unstructured":"Petersen A. M. Tenenbaum J. N. Havlin S. Stanley H. E. (2012b). Statistical laws governing fluctuations in word use from word birth to word death. Scientific Reports [Online] 2. http:\/\/www.nature.com\/doifinder\/10.1038\/srep00313 (accessed 10 March 2014).","DOI":"10.1038\/srep00313"},{"key":"2015090219135172000_fqv037v1.56","doi-asserted-by":"publisher","DOI":"10.2202\/1944-2858.1173"},{"key":"2015090219135172000_fqv037v1.57","doi-asserted-by":"crossref","first-page":"101","DOI":"10.1515\/9783110226423.101","article-title":"Does frequency in text instantiate entrenchment in the cognitive system?","volume-title":"Quantitative Methods in Cognitive Semantics: Corpus-Driven Approaches","author":"Schmid","year":"2010"},{"key":"2015090219135172000_fqv037v1.58","unstructured":"Schmidt B. (2013). Are words the atomic unit of a dynamic system? Sapping Attention [Online]. http:\/\/sappingattention.blogspot.de\/2013\/02\/are-words-atomic-unit-of-dynmic-system.html (accessed 10 March 2014)."},{"key":"2015090219135172000_fqv037v1.59","unstructured":"Szmrecsanyi B. (2014). About text frequencies in historical linguistics: disentangling environmental and grammatical change. Corpus Linguistics and Linguistic Theory [Online]. http:\/\/www.benszm.net\/omnibuslit\/Szmrecsanyi_CH_web.pdf (accessed 8 September 2014)."},{"key":"2015090219135172000_fqv037v1.60","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0040181"},{"key":"2015090219135172000_fqv037v1.61","unstructured":"Underwood T. (2012). ngrams | The Stone and the Shell. The Stone and the Shell - Historical Questions Raised by a Quantitative Approach to Language [Online]. http:\/\/tedunderwood.com\/category\/ngrams\/ (accessed 10 March 2014)."},{"key":"2015090219135172000_fqv037v1.62","unstructured":"Wikimedia Foundation Inc . (2015a). Liste von Austriazismen \u2013 Wikipedia [Online]. http:\/\/de.wikipedia.org\/wiki\/Liste_von_Austriazismen (accessed 29 January 2015)."},{"key":"2015090219135172000_fqv037v1.63","unstructured":"Wikimedia Foundation Inc . (2015b). Liste von Helvetismen \u2013 Wikipedia [Online]. http:\/\/de.wikipedia.org\/wiki\/Liste_von_Helvetismen (accessed 29 January 2015)."},{"key":"2015090219135172000_fqv037v1.64","volume-title":"A People\u2019s History of the United States: 1492-Present","author":"Zinn","year":"2001"}],"container-title":["Digital Scholarship in the Humanities"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/academic.oup.com\/dsh\/article-pdf\/32\/1\/169\/17506188\/fqv037.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,8,30]],"date-time":"2019-08-30T04:02:36Z","timestamp":1567137756000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/dsh\/article-lookup\/doi\/10.1093\/llc\/fqv037"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,9,2]]},"references-count":64,"alternative-id":["10.1093\/llc\/fqv037"],"URL":"https:\/\/doi.org\/10.1093\/llc\/fqv037","relation":{},"ISSN":["2055-7671","2055-768X"],"issn-type":[{"value":"2055-7671","type":"print"},{"value":"2055-768X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,9,2]]}}}