{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,25]],"date-time":"2025-06-25T13:51:10Z","timestamp":1750859470003},"reference-count":16,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014,10]]},"DOI":"10.1109\/bigdata.2014.7004312","type":"proceedings-article","created":{"date-parts":[[2015,1,13]],"date-time":"2015-01-13T20:04:23Z","timestamp":1421179463000},"page":"825-834","source":"Crossref","is-referenced-by-count":3,"title":["Recall estimation for rare topic retrieval from large corpuses"],"prefix":"10.1109","author":[{"given":"Praveen","family":"Bommannavar","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alek","family":"Kolcz","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Anand","family":"Rajaraman","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"15","doi-asserted-by":"publisher","DOI":"10.1145\/354756.354805"},{"journal-title":"Topical Host Reputation for Lightweight Url Classification","year":"2012","author":"kolcz","key":"16"},{"key":"13","doi-asserted-by":"publisher","DOI":"10.1145\/2433396.2433450"},{"journal-title":"Mathematical Statistics and Data Analysis","year":"2007","author":"rice","key":"14"},{"key":"11","doi-asserted-by":"publisher","DOI":"10.1109\/SLT.2006.326780"},{"key":"12","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-031-01555-7","author":"law","year":"2011","journal-title":"Human Computation (Synthesis Lectures on Artificial Intelligence and Machine Learning)"},{"key":"3","doi-asserted-by":"publisher","DOI":"10.1145\/279943.279962"},{"key":"2","doi-asserted-by":"publisher","DOI":"10.1145\/2623330.2623336"},{"journal-title":"Introduction to Information Retrieval","year":"2011","author":"manning","key":"1"},{"key":"10","doi-asserted-by":"publisher","DOI":"10.1145\/1645953.1646031"},{"key":"7","article-title":"Online stratified sampling: Evaluating classifiers at web-scale","author":"bennett","year":"2010","journal-title":"Short-paper in Proceedings of the 19th ACM International Conference on Information and Knowledge Management (CIKM '10)"},{"key":"6","first-page":"1081","author":"he","year":"2009","journal-title":"Threshold Selection for Web-page Classification with Highly Skewed Class Distribution"},{"journal-title":"Approximate Recall Confidence Intervals","year":"2012","author":"webber","key":"5"},{"journal-title":"Counting Positives Accurately Despite Inaccurate Classification","year":"2005","author":"forman","key":"4"},{"key":"9","doi-asserted-by":"publisher","DOI":"10.1108\/eb050097"},{"journal-title":"Evaluating Learning Algorithms A Classification Perspective","year":"2008","author":"japkowicz","key":"8"}],"event":{"name":"2014 IEEE International Conference on Big Data (Big Data)","start":{"date-parts":[[2014,10,27]]},"location":"Washington, DC, USA","end":{"date-parts":[[2014,10,30]]}},"container-title":["2014 IEEE International Conference on Big Data (Big Data)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6973861\/7004197\/07004312.pdf?arnumber=7004312","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,7,31]],"date-time":"2023-07-31T22:01:16Z","timestamp":1690840876000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7004312\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,10]]},"references-count":16,"URL":"https:\/\/doi.org\/10.1109\/bigdata.2014.7004312","relation":{},"subject":[],"published":{"date-parts":[[2014,10]]}}}