{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,15]],"date-time":"2026-01-15T04:26:28Z","timestamp":1768451188196,"version":"3.49.0"},"reference-count":36,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2015,10,16]],"date-time":"2015-10-16T00:00:00Z","timestamp":1444953600000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0"}],"funder":[{"name":"The Omidyar Group"},{"DOI":"10.13039\/100011419","name":"Santa Fe Institute","doi-asserted-by":"crossref","id":[{"id":"10.13039\/100011419","id-type":"DOI","asserted-by":"crossref"}]},{"name":"NIH MIDAS Center of Excellence at the Harvard Center for Communicable Disease Dynamics"},{"name":"William Sick"},{"name":"Mike Frumkin and the Frumkin Falco Family Foundation"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["EPJ Data Sci."],"published-print":{"date-parts":[[2015,12]]},"DOI":"10.1140\/epjds\/s13688-015-0054-0","type":"journal-article","created":{"date-parts":[[2015,10,18]],"date-time":"2015-10-18T23:40:04Z","timestamp":1445211604000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":124,"title":["Enhancing disease surveillance with novel data streams: challenges and opportunities"],"prefix":"10.1140","volume":"4","author":[{"given":"Benjamin M","family":"Althouse","sequence":"first","affiliation":[]},{"given":"Samuel V","family":"Scarpino","sequence":"additional","affiliation":[]},{"given":"Lauren Ancel","family":"Meyers","sequence":"additional","affiliation":[]},{"given":"John W","family":"Ayers","sequence":"additional","affiliation":[]},{"given":"Marisa","family":"Bargsten","sequence":"additional","affiliation":[]},{"given":"Joan","family":"Baumbach","sequence":"additional","affiliation":[]},{"given":"John S","family":"Brownstein","sequence":"additional","affiliation":[]},{"given":"Lauren","family":"Castro","sequence":"additional","affiliation":[]},{"given":"Hannah","family":"Clapham","sequence":"additional","affiliation":[]},{"given":"Derek AT","family":"Cummings","sequence":"additional","affiliation":[]},{"given":"Sara","family":"Del Valle","sequence":"additional","affiliation":[]},{"given":"Stephen","family":"Eubank","sequence":"additional","affiliation":[]},{"given":"Geoffrey","family":"Fairchild","sequence":"additional","affiliation":[]},{"given":"Lyn","family":"Finelli","sequence":"additional","affiliation":[]},{"given":"Nicholas","family":"Generous","sequence":"additional","affiliation":[]},{"given":"Dylan","family":"George","sequence":"additional","affiliation":[]},{"given":"David R","family":"Harper","sequence":"additional","affiliation":[]},{"given":"Laurent","family":"H\u00e9bert-Dufresne","sequence":"additional","affiliation":[]},{"given":"Michael A","family":"Johansson","sequence":"additional","affiliation":[]},{"given":"Kevin","family":"Konty","sequence":"additional","affiliation":[]},{"given":"Marc","family":"Lipsitch","sequence":"additional","affiliation":[]},{"given":"Gabriel","family":"Milinovich","sequence":"additional","affiliation":[]},{"given":"Joseph D","family":"Miller","sequence":"additional","affiliation":[]},{"given":"Elaine O","family":"Nsoesie","sequence":"additional","affiliation":[]},{"given":"Donald R","family":"Olson","sequence":"additional","affiliation":[]},{"given":"Michael","family":"Paul","sequence":"additional","affiliation":[]},{"given":"Philip M","family":"Polgreen","sequence":"additional","affiliation":[]},{"given":"Reid","family":"Priedhorsky","sequence":"additional","affiliation":[]},{"given":"Jonathan M","family":"Read","sequence":"additional","affiliation":[]},{"given":"Isabel","family":"Rodr\u00edguez-Barraquer","sequence":"additional","affiliation":[]},{"given":"Derek J","family":"Smith","sequence":"additional","affiliation":[]},{"given":"Christian","family":"Stefansen","sequence":"additional","affiliation":[]},{"given":"David L","family":"Swerdlow","sequence":"additional","affiliation":[]},{"given":"Deborah","family":"Thompson","sequence":"additional","affiliation":[]},{"given":"Alessandro","family":"Vespignani","sequence":"additional","affiliation":[]},{"given":"Amy","family":"Wesolowski","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2015,10,16]]},"reference":[{"issue":"1","key":"54_CR1","doi-asserted-by":"crossref","DOI":"10.5210\/ojphi.v5i1.4456","volume":"5","author":"R Chunara","year":"2013","unstructured":"Chunara R, Aman S, Smolinski M, Brownstein JS (2013) Flu Near You: an online self-reported influenza surveillance system in the USA. Online J Public Health Inform 5(1):e133","journal-title":"Online J Public Health Inform"},{"issue":"1","key":"54_CR2","doi-asserted-by":"crossref","first-page":"17","DOI":"10.1111\/1469-0691.12477","volume":"20","author":"D Paolotti","year":"2014","unstructured":"Paolotti D, Carnahan A, Colizza V, Eames K, Edmunds J, Gomes G, Koppeschaar C, Rehn M, Smallenburg R, Turbelin C et al. (2014) Web-based participatory surveillance of infectious diseases: the Influenzanet participatory surveillance experience. Clin Microbiol Infect 20(1):17-21","journal-title":"Clin Microbiol Infect"},{"key":"54_CR3","doi-asserted-by":"crossref","DOI":"10.1371\/currents.RRN1251","volume":"3","author":"DR Olson","year":"2011","unstructured":"Olson DR, Paladini M, Lober WB, Buckeridge DL, ISDS Distribute Working Group (2011) Applying a new model for sharing population health data to national syndromic influenza surveillance: DiSTRIBuTE project proof of concept, 2006 to 2009. PLoS Curr 3:RRN1251","journal-title":"PLoS Curr"},{"issue":"1","key":"54_CR4","doi-asserted-by":"crossref","DOI":"10.5210\/ojphi.v5i1.4556","volume":"5","author":"KG Chester","year":"2013","unstructured":"Chester KG (2013) BioSense 2.0. Online J Public Health Inform 5(1):e200","journal-title":"Online J Public Health Inform"},{"key":"54_CR5","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pntd.0001258","volume":"5","author":"BM Althouse","year":"2011","unstructured":"Althouse BM, Ng YY, Cummings DAT (2011) Prediction of dengue incidence using search query surveillance. PLoS Negl Trop Dis 5:e1258","journal-title":"PLoS Negl Trop Dis"},{"issue":"2","key":"54_CR6","doi-asserted-by":"crossref","first-page":"160","DOI":"10.1016\/S1473-3099(13)70244-5","volume":"14","author":"GJ Milinovich","year":"2014","unstructured":"Milinovich GJ, Williams GM, Clements AC, Hu W (2014) Internet-based surveillance systems for monitoring emerging infectious diseases. Lancet Infect Dis 14(2):160-168","journal-title":"Lancet Infect Dis"},{"issue":"11","key":"54_CR7","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pone.0014118","volume":"5","author":"C Chew","year":"2010","unstructured":"Chew C, Eysenbach G (2010) Pandemics in the age of Twitter: content analysis of tweets during the 2009 H1N1 outbreak. PLoS ONE 5(11):e14118","journal-title":"PLoS ONE"},{"issue":"12","key":"54_CR8","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pone.0083672","volume":"8","author":"DA Broniatowski","year":"2013","unstructured":"Broniatowski DA, Paul MJ, Dredze M (2013) National and local influenza surveillance through Twitter: an analysis of the 2012-2013 influenza epidemic. PLoS ONE 8(12):e83672","journal-title":"PLoS ONE"},{"issue":"4","key":"54_CR9","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pcbi.1003581","volume":"10","author":"DJ McIver","year":"2014","unstructured":"McIver DJ, Brownstein JS (2014) Wikipedia usage estimates prevalence of influenza-like illness in the United States in near real-time. PLoS Comput Biol 10(4):e1003581","journal-title":"PLoS Comput Biol"},{"key":"54_CR10","doi-asserted-by":"crossref","unstructured":"Generous N, Fairchild G, Deshpande A, Del Valle SY, Priedhorsky R (2014) Global disease monitoring and forecasting with Wikipedia. arXiv:1405.3612","DOI":"10.1371\/journal.pcbi.1003892"},{"issue":"1","key":"54_CR11","doi-asserted-by":"crossref","DOI":"10.2196\/jmir.2998","volume":"16","author":"EO Nsoesie","year":"2014","unstructured":"Nsoesie EO, Buckeridge DL, Brownstein JS (2014) Guess who\u2019s not coming to dinner? Evaluating online restaurant reservations for disease surveillance. J Med Internet Res 16(1):e22","journal-title":"J Med Internet Res"},{"issue":"20","key":"54_CR12","first-page":"441","volume":"63","author":"C Harrison","year":"2014","unstructured":"Harrison C, Jorder M, Stern H, Stavinsky F, Reddy V, Hanson H, Waechter H, Lowe L, Gravano L, Balter S et al. (2014) Using online reviews by restaurant patrons to identify unreported cases of foodborne illness - New York City, 2012-2013. Morb Mort Wkly Rep 63(20):441-445","journal-title":"Morb Mort Wkly Rep"},{"issue":"Suppl","key":"54_CR13","first-page":"41","volume":"54","author":"D Das","year":"2005","unstructured":"Das D, Metzger K, Heffernan R, Balter S, Weiss D, Mostashari F et al. (2005) Monitoring over-the-counter medication sales for early detection of disease outbreaks - New York City. Morb Mort Wkly Rep 54(Suppl):41-46","journal-title":"Morb Mort Wkly Rep"},{"issue":"8","key":"54_CR14","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pone.0043611","volume":"7","author":"A Patwardhan","year":"2012","unstructured":"Patwardhan A, Bilkovski R (2012) Comparison: flu prescription sales data from a retail pharmacy in the US with Google flu trends and US ILINet (CDC) data as flu activity indicator. PLoS ONE 7(8):e43611","journal-title":"PLoS ONE"},{"key":"54_CR15","doi-asserted-by":"crossref","first-page":"150","DOI":"10.1197\/jamia.M2544","volume":"15","author":"CC Freifeld","year":"2008","unstructured":"Freifeld CC, Mandl KD, Reis BY, Brownstein JS (2008) HealthMap: global infectious disease monitoring through automated classification and visualization of Internet media reports. J Am Med Inform Assoc 15:150-157","journal-title":"J Am Med Inform Assoc"},{"issue":"2","key":"54_CR16","doi-asserted-by":"crossref","first-page":"272","DOI":"10.1086\/510427","volume":"44","author":"PM Polgreen","year":"2007","unstructured":"Polgreen PM, Nelson FD, Neumann GR, Weinstein RA (2007) Use of prediction markets to forecast infectious disease activity. Clin Infect Dis 44(2):272-279","journal-title":"Clin Infect Dis"},{"key":"54_CR17","doi-asserted-by":"crossref","first-page":"1012","DOI":"10.1038\/nature07634","volume":"457","author":"J Ginsberg","year":"2008","unstructured":"Ginsberg J, Mohebbi MH, Patel RS, Brammer L, Smolinski MS, Brilliant L (2008) Detecting influenza epidemics using search engine query data. Nature 457:1012-1014","journal-title":"Nature"},{"key":"54_CR18","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pcbi.1003256","volume":"9","author":"DR Olson","year":"2013","unstructured":"Olson DR, Konty KJ, Paladini M, Viboud C, Simonsen L (2013) Reassessing Google flu trends data for detection of seasonal and pandemic influenza: a comparative epidemiological study at three geographic scales. PLoS Comput Biol 9:e1003256","journal-title":"PLoS Comput Biol"},{"issue":"6176","key":"54_CR19","doi-asserted-by":"crossref","first-page":"1203","DOI":"10.1126\/science.1248506","volume":"343","author":"D Lazer","year":"2014","unstructured":"Lazer D, Kennedy R, King G, Vespignani A (2014) The parable of Google flu: traps in big data analysis. Science 343(6176):1203-1205","journal-title":"Science"},{"issue":"3","key":"54_CR20","doi-asserted-by":"crossref","first-page":"341","DOI":"10.1016\/j.amepre.2014.05.020","volume":"47","author":"M Santillana","year":"2014","unstructured":"Santillana M, Zhang DW, Althouse BM, Ayers JW (2014) What can digital disease detection learn from (an external revision to) Google flu trends? Am J Prev Med 47(3):341-347","journal-title":"Am J Prev Med"},{"issue":"5","key":"54_CR21","volume":"8","author":"Q Yuan","year":"2013","unstructured":"Yuan Q, Nsoesie EO, Lv B, Peng G, Chunara R, Brownstein JS (2013) Monitoring influenza epidemics in China with search query from Baidu. PLoS ONE 8(5):e64323","journal-title":"PLoS ONE"},{"key":"54_CR22","doi-asserted-by":"crossref","first-page":"1443","DOI":"10.1086\/593098","volume":"47","author":"PM Polgreen","year":"2008","unstructured":"Polgreen PM, Chen Y, Pennock DM, Nelson FD, Weinstein RA (2008) Using Internet searches for influenza surveillance. Clin Infect Dis 47:1443-1448","journal-title":"Clin Infect Dis"},{"issue":"4","key":"54_CR23","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pcbi.1002472","volume":"8","author":"SV Scarpino","year":"2012","unstructured":"Scarpino SV, Dimitrov NB, Meyers LA (2012) Optimizing provider recruitment for influenza surveillance networks. PLoS Comput Biol 8(4):e1002472","journal-title":"PLoS Comput Biol"},{"issue":"14","key":"54_CR24","doi-asserted-by":"crossref","first-page":"1399","DOI":"10.1001\/jama.2014.1505","volume":"311","author":"JW Ayers","year":"2014","unstructured":"Ayers JW, Althouse BM, Dredze M (2014) Could behavioral medicine lead the web data revolution? JAMA 311(14):1399-1400","journal-title":"JAMA"},{"issue":"2","key":"54_CR25","doi-asserted-by":"crossref","first-page":"166","DOI":"10.1016\/j.amepre.2013.10.008","volume":"46","author":"BM Althouse","year":"2014","unstructured":"Althouse BM, Allem J-P, Childers MA, Dredze M, Ayers JW (2014) Population health concerns during the United States\u2019 Great Recession. Am J Prev Med 46(2):166-170","journal-title":"Am J Prev Med"},{"key":"54_CR26","author":"M Santillana","year":"2014","unstructured":"Santillana M, Nsoesie EO, Mekaru SR, Scales D, Brownstein JS (2014) Using clinicians\u2019 search query data to monitor influenza epidemics. Clin Infect Dis. doi: 10.1093\/cid\/ciu647","journal-title":"Clin Infect Dis"},{"key":"54_CR27","author":"JW Ayers","year":"2009","unstructured":"Ayers JW, Althouse BM, Ribisl KM, Emery S (2009) Digital detection for tobacco control: online reactions to the United States. Nicotine Tob Res. doi: 10.1093\/ntr\/ntt186","journal-title":"Nicotine Tob Res"},{"key":"54_CR28","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pone.0016777","volume":"6","author":"JW Ayers","year":"2011","unstructured":"Ayers JW, Ribisl K, Brownstein JS (2011) Using search query surveillance to monitor tax avoidance and smoking cessation following the United States\u2019 2009 \u201cSCHIP\u201d cigarette tax increase. PLoS ONE 6:e16777","journal-title":"PLoS ONE"},{"key":"54_CR29","doi-asserted-by":"crossref","first-page":"81","DOI":"10.1016\/j.ypmed.2013.11.007","volume":"58","author":"JW Ayers","year":"2014","unstructured":"Ayers JW, Althouse BM, Noar SM, Cohen JE (2014) Do celebrity cancer diagnoses promote primary cancer prevention? Prev Med 58:81-84","journal-title":"Prev Med"},{"issue":"47","key":"54_CR30","doi-asserted-by":"crossref","first-page":"188","DOI":"10.1093\/jncimonographs\/lgt017","volume":"2013","author":"SM Noar","year":"2013","unstructured":"Noar SM, Ribisl KM, Althouse BM, Willoughby JF, Ayers JW (2013) Using digital surveillance to examine the impact of public figure pancreatic cancer announcements on media and search query outcomes. J Natl Cancer Inst Monographs 2013(47):188-194","journal-title":"J Natl Cancer Inst Monographs"},{"issue":"Suppl 5","key":"54_CR31","first-page":"1","volume":"37","author":"DN Klaucke","year":"1988","unstructured":"Klaucke DN, Buehler JW, Thacker SB, Parrish RG, Trowbridge FL, Berkelman RL et al. (1988) Guidelines for evaluating surveillance systems. Morb Mort Wkly Rep 37(Suppl 5):1-18","journal-title":"Morb Mort Wkly Rep"},{"key":"54_CR32","first-page":"1137","volume-title":"IJCAI\u201995","author":"R Kohavi","year":"1995","unstructured":"Kohavi R et al. (1995) A study of cross-validation and bootstrap for accuracy estimation and model selection. In: IJCAI\u201995, vol\u00a02, pp\u00a01137-1145"},{"key":"54_CR33","doi-asserted-by":"crossref","DOI":"10.1007\/978-0-387-84858-7","volume-title":"The elements of statistical learning","author":"T Hastie","year":"2009","unstructured":"Hastie T, Tibshirani R, Friedman J (2009) The elements of statistical learning, 2nd edn. Springer, Berlin","edition":"2"},{"key":"54_CR34","first-page":"668","volume-title":"Advances in neural information processing systems","author":"P Smyth","year":"1998","unstructured":"Smyth P, Wolpert D (1998) Stacked density estimation. In: Advances in neural information processing systems, pp\u00a0668-674"},{"key":"54_CR35","volume-title":"Machine learning: a probabilistic perspective","author":"KP Murphy","year":"2012","unstructured":"Murphy KP (2012) Machine learning: a probabilistic perspective. MIT Press, Cambridge"},{"key":"54_CR36","doi-asserted-by":"crossref","unstructured":"Wolpert DH (2012) What the no free lunch theorems really mean; how to improve search algorithms. Working paper, Santa Fe Institute","DOI":"10.1145\/2555235.2555237"}],"container-title":["EPJ Data Science"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1140\/epjds\/s13688-015-0054-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1140\/epjds\/s13688-015-0054-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1140\/epjds\/s13688-015-0054-0","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,5,16]],"date-time":"2020-05-16T00:16:40Z","timestamp":1589588200000},"score":1,"resource":{"primary":{"URL":"http:\/\/www.epjdatascience.com\/content\/4\/1\/17"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,10,16]]},"references-count":36,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2015,12]]}},"alternative-id":["54"],"URL":"https:\/\/doi.org\/10.1140\/epjds\/s13688-015-0054-0","relation":{},"ISSN":["2193-1127"],"issn-type":[{"value":"2193-1127","type":"electronic"}],"subject":[],"published":{"date-parts":[[2015,10,16]]},"article-number":"17"}}