{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,21]],"date-time":"2026-02-21T18:58:25Z","timestamp":1771700305365,"version":"3.50.1"},"reference-count":41,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2017,1,7]],"date-time":"2017-01-07T00:00:00Z","timestamp":1483747200000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2017,1,7]],"date-time":"2017-01-07T00:00:00Z","timestamp":1483747200000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"name":"National Science Foundation","award":["IIS - 1319578"],"award-info":[{"award-number":["IIS - 1319578"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Digit Libr"],"published-print":{"date-parts":[[2018,3]]},"DOI":"10.1007\/s00799-016-0207-1","type":"journal-article","created":{"date-parts":[[2017,1,7]],"date-time":"2017-01-07T10:52:35Z","timestamp":1483786355000},"page":"3-19","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":29,"title":["Focused crawler for events"],"prefix":"10.1007","volume":"19","author":[{"given":"Mohamed M. G.","family":"Farag","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Sunshin","family":"Lee","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Edward A.","family":"Fox","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2017,1,7]]},"reference":[{"issue":"1","key":"207_CR1","first-page":"17","volume":"1","author":"T O\u2019reilly","year":"2007","unstructured":"O\u2019reilly, T.: What is web 2.0: design patterns and business models for the next generation of software. Commun. Strateg. 1(1), 17 (2007)","journal-title":"Commun. Strateg."},{"key":"207_CR2","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-031-02284-5","volume-title":"Digital Libraries Applications: CBIR, Education, Social Networks, eScience\/Simulation, and GIS","author":"EA Fox","year":"2014","unstructured":"Fox, E.A., Leidig, J.P.: Digital Libraries Applications: CBIR, Education, Social Networks, eScience\/Simulation, and GIS, vol. 6. Morgan & Claypool Publishers, San Rafael (2014)"},{"key":"207_CR3","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-031-02285-2","volume-title":"Digital Library Technologies: Complex Objects, Annotation, Ontologies, Classification, Extraction, and Security","author":"EA Fox","year":"2014","unstructured":"Fox, E.A., da Silva Torres, R.: Digital Library Technologies: Complex Objects, Annotation, Ontologies, Classification, Extraction, and Security, vol. 6. Morgan & Claypool Publishers, San Rafael (2014)"},{"key":"207_CR4","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-031-02283-8","volume-title":"Key Issues Regarding Digital Libraries: Evaluation and Integration","author":"R Shen","year":"2013","unstructured":"Shen, R., Goncalves, M.A., Fox, E.A.: Key Issues Regarding Digital Libraries: Evaluation and Integration, vol. 5. Morgan & Claypool Publishers, San Rafael (2013)"},{"key":"207_CR5","unstructured":"IDEAL. Integrated Digital Event Archive and Library. Accessed: 2016-07-26"},{"key":"207_CR6","unstructured":"Internet Archive. A digital library of free content and wayback machine. Accessed: 2016-07-26"},{"key":"207_CR7","unstructured":"Archive-It Collections. Spontaneous events. Accessed: 2016-07-26"},{"key":"207_CR8","doi-asserted-by":"crossref","unstructured":"Farag, M., Nakate, P., Fox, E.A.: Big data processing of school shooting archives. In: Proceedings of the 16th ACM\/IEEE-CS on Joint Conference on Digital Libraries, pp. 271\u2013272. ACM (2016)","DOI":"10.1145\/2910896.2925466"},{"key":"207_CR9","unstructured":"IDEAL Collections. IDEAL event collections. Accessed: 2016-07-26"},{"key":"207_CR10","unstructured":"Archive-It. Web archiving services for libraries and archives. Accessed: 2016-07-26"},{"issue":"10","key":"207_CR11","doi-asserted-by":"publisher","first-page":"1001","DOI":"10.1016\/j.datak.2009.04.002","volume":"68","author":"S Batsakis","year":"2009","unstructured":"Batsakis, S., Petrakis, E.G.M., Milios, E.: Improving the performance of focused web crawlers. Data Knowl. Eng. 68(10), 1001\u20131013 (2009)","journal-title":"Data Knowl. Eng."},{"issue":"11","key":"207_CR12","doi-asserted-by":"publisher","first-page":"1623","DOI":"10.1016\/S1389-1286(99)00052-3","volume":"31","author":"S Chakrabarti","year":"1999","unstructured":"Chakrabarti, S., Van den Berg, M., Dom, B.: Focused crawling: a new approach to topic-specific web resource discovery. Comput. Netw. 31(11), 1623\u20131640 (1999)","journal-title":"Comput. Netw."},{"issue":"4","key":"207_CR13","doi-asserted-by":"publisher","first-page":"430","DOI":"10.1145\/1095872.1095875","volume":"23","author":"G Pant","year":"2005","unstructured":"Pant, G., Srinivasan, P.: Learning to crawl: comparing classification schemes. ACM Trans. Inf. Syst. (TOIS) 23(4), 430\u2013462 (2005)","journal-title":"ACM Trans. Inf. Syst. (TOIS)"},{"key":"207_CR14","unstructured":"Rennie, J., McCallum, A.: Efficient web spidering with reinforcement learning. In: Proceedings of the International Conference on Machine Learning. Citeseer (1999)"},{"key":"207_CR15","doi-asserted-by":"crossref","unstructured":"Grigoriadis, A., Paliouras, G.: Focused crawling using temporal difference-learning. In: Hellenic Conference on Artificial Intelligence, pp. 142\u2013153. Springer (2004)","DOI":"10.1007\/978-3-540-24674-9_16"},{"key":"207_CR16","doi-asserted-by":"crossref","unstructured":"Singh, N., Sandhawalia, H., Monet, N., Poirier, H., Coursimault, J.-M.: Large scale URL-based classification using online incremental learning. In: 2012 11th International Conference on Machine Learning and Applications (ICMLA), vol.\u00a02, pp. 402\u2013409. IEEE (2012)","DOI":"10.1109\/ICMLA.2012.199"},{"key":"207_CR17","doi-asserted-by":"crossref","unstructured":"Menczer, F., Monge, A.E.: Scalable web search by adaptive online agents: an infospiders case study. In: Intelligent Information Agents, pp. 323\u2013347. Springer (1999)","DOI":"10.1007\/978-3-642-60018-0_17"},{"key":"207_CR18","unstructured":"Dong, H., Hussain, F.K., Chang, E.: A survey in semantic web technologies-inspired focused crawlers. In: Third International Conference on Digital Information Management, 2008 (ICDIM 2008), pp. 934\u2013936. IEEE (2008)"},{"key":"207_CR19","doi-asserted-by":"crossref","unstructured":"Ehrig, M., Maedche, A.: Ontology-focused crawling of web documents. In: Proceedings of the 2003 ACM symposium on Applied computing, pp. 1174\u20131178. ACM (2003)","DOI":"10.1145\/952532.952761"},{"issue":"6","key":"207_CR20","doi-asserted-by":"publisher","first-page":"886","DOI":"10.1016\/j.is.2006.09.004","volume":"32","author":"G Almpanidis","year":"2007","unstructured":"Almpanidis, G., Kotropoulos, C., Pitas, I.: Combining text and link analysis for focused crawling\u2014an application for vertical search engines. Inf. Syst. 32(6), 886\u2013908 (2007)","journal-title":"Inf. Syst."},{"key":"207_CR21","unstructured":"Diligenti, M., Coetzee, F., Lawrence, S., Giles, C.L., Gori, M. et\u00a0al.: Focused crawling using context graphs. In: VLDB, pp. 527\u2013534 (2000)"},{"issue":"1","key":"207_CR22","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1109\/TKDE.2006.12","volume":"18","author":"G Pant","year":"2006","unstructured":"Pant, G., Srinivasan, P.: Link contexts in classifier-guided topical crawlers. IEEE Trans. Knowl. Data Eng. 18(1), 107\u2013122 (2006)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"207_CR23","doi-asserted-by":"crossref","unstructured":"Kleinberg, J.M., Kumar, R., Raghavan, P., Rajagopalan, S., Tomkins, A.S.: The web as a graph: measurements, models, and methods. In: International Computing and Combinatorics Conference, pp. 1\u201317. Springer (1999)","DOI":"10.1007\/3-540-48686-0_1"},{"issue":"18","key":"207_CR24","doi-asserted-by":"publisher","first-page":"3825","DOI":"10.1016\/j.comnet.2012.10.007","volume":"56","author":"S Brin","year":"2012","unstructured":"Brin, S., Page, L.: Reprint of: The anatomy of a large-scale hypertextual web search engine. Comput. Netw. 56(18), 3825\u20133833 (2012)","journal-title":"Comput. Netw."},{"key":"207_CR25","doi-asserted-by":"crossref","unstructured":"De\u00a0Assis, Guilherme\u00a0T., Laender, A.H.F., Gon\u00e7alves, M.A., Da\u00a0Silva, A.S.: Exploiting genre in focused crawling. In: International Symposium on String Processing and Information Retrieval, pp. 62\u201373. Springer (2007)","DOI":"10.1007\/978-3-540-75530-2_6"},{"issue":"2","key":"207_CR26","doi-asserted-by":"publisher","first-page":"345","DOI":"10.1287\/isre.1080.0231","volume":"21","author":"G Pant","year":"2010","unstructured":"Pant, G., Srinivasan, P.: Predicting web page status. Inf. Syst. Res. 21(2), 345\u2013364 (2010)","journal-title":"Inf. Syst. Res."},{"issue":"3","key":"207_CR27","doi-asserted-by":"publisher","first-page":"802","DOI":"10.1287\/isre.1120.0457","volume":"24","author":"G Pant","year":"2013","unstructured":"Pant, G., Srinivasan, P.: Status locality on the web: implications for building focused collections. Inf. Syst. Res. 24(3), 802\u2013821 (2013)","journal-title":"Inf. Syst. Res."},{"key":"207_CR28","unstructured":"Chen, Y.: A novel hybrid focused crawling algorithm to build domain-specific collections. PhD thesis, Virginia Polytechnic Institute and State University (2007)"},{"key":"207_CR29","doi-asserted-by":"crossref","unstructured":"Allan, J.: Introduction to topic detection and tracking. In: Topic detection and tracking, pp. 1\u201316. Springer (2002)","DOI":"10.1007\/978-1-4615-0933-2_1"},{"key":"207_CR30","unstructured":"Volkova, S., Caragea, D., Hsu, W.H., Bujuru, S.: Animal disease event recognition and classification. In: Proceedings of the First International Workshop on Web Science and Information Exchange in the Medical Web (MedEx 2010). Citeseer (2010)"},{"issue":"1","key":"207_CR31","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1109\/MMUL.2007.23","volume":"14","author":"U Westermann","year":"2007","unstructured":"Westermann, U., Jain, R.: Toward a common event model for multimedia applications. IEEE Multimed. 14(1), 19\u201329 (2007)","journal-title":"IEEE Multimed."},{"key":"207_CR32","doi-asserted-by":"crossref","unstructured":"Str\u00f6tgen, J., Gertz, M., Junghans, C.: An event-centric model for multilingual document similarity. In: Proceedings of the 34th International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 953\u2013962. ACM (2011)","DOI":"10.1145\/2009916.2010043"},{"key":"207_CR33","unstructured":"Farag, M.M.G., Fox, E.A.: Intelligent event focused crawling. In: Proceedings of the 11th International ISCRAM Conference. University Park, Pennsylvania, USA (2014)"},{"key":"207_CR34","volume-title":"Topic Detection and Tracking: Event-Based Information Organization","author":"J Allan","year":"2012","unstructured":"Allan, J.: Topic Detection and Tracking: Event-Based Information Organization, vol. 12. Springer, Berlin (2012)"},{"key":"207_CR35","doi-asserted-by":"crossref","unstructured":"Gossen, G., Demidova, E., Risse, T.: iCrawl: improving the freshness of web collections by integrating social web and focused web crawling. In: Proceedings of the 15th ACM\/IEEE-CS Joint Conference on Digital Libraries, pp. 75\u201384. ACM (2015)","DOI":"10.1145\/2756406.2756925"},{"key":"207_CR36","doi-asserted-by":"crossref","unstructured":"AlNoamany, Y., Weigle, M.C., Nelson, M.L.: Detecting off-topic pages in web archives. In: International Conference on Theory and Practice of Digital Libraries, pp. 225\u2013237. Springer (2015)","DOI":"10.1007\/978-3-319-24592-8_17"},{"issue":"11","key":"207_CR37","doi-asserted-by":"publisher","first-page":"613","DOI":"10.1145\/361219.361220","volume":"18","author":"G Salton","year":"1975","unstructured":"Salton, G., Wong, A., Yang, C.-S.: A vector space model for automatic indexing. Commun. ACM 18(11), 613\u2013620 (1975)","journal-title":"Commun. ACM"},{"issue":"4","key":"207_CR38","doi-asserted-by":"publisher","first-page":"378","DOI":"10.1145\/1031114.1031117","volume":"4","author":"F Menczer","year":"2004","unstructured":"Menczer, F., Pant, G., Srinivasan, P.: Topical web crawlers: evaluating adaptive algorithms. ACM Trans. Internet Technol. (TOIT) 4(4), 378\u2013419 (2004)","journal-title":"ACM Trans. Internet Technol. (TOIT)"},{"key":"207_CR39","doi-asserted-by":"crossref","unstructured":"Klein, M., Shipman, J., Nelson, M.L.: Is this a good title? In: Proceedings of the 21st ACM Conference on Hypertext and Hypermedia, pp. 3\u201312. ACM (2010)","DOI":"10.1145\/1810617.1810621"},{"key":"207_CR40","doi-asserted-by":"crossref","unstructured":"Finkel, J.R., Grenager, T., Manning, C.: Incorporating non-local information into information extraction systems by gibbs sampling. In: Proceedings of the 43rd Annual Meeting on Association for Computational Linguistics, pp. 363\u2013370. Association for Computational Linguistics (2005)","DOI":"10.3115\/1219840.1219885"},{"key":"207_CR41","volume-title":"Modern Information Retrieval","author":"R Baeza-Yates","year":"1999","unstructured":"Baeza-Yates, R., Ribeiro-Neto, B., et al.: Modern Information Retrieval, vol. 463. ACM press, New York (1999)"}],"container-title":["International Journal on Digital Libraries"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00799-016-0207-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00799-016-0207-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00799-016-0207-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,20]],"date-time":"2022-07-20T23:10:54Z","timestamp":1658358654000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00799-016-0207-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,1,7]]},"references-count":41,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2018,3]]}},"alternative-id":["207"],"URL":"https:\/\/doi.org\/10.1007\/s00799-016-0207-1","relation":{},"ISSN":["1432-5012","1432-1300"],"issn-type":[{"value":"1432-5012","type":"print"},{"value":"1432-1300","type":"electronic"}],"subject":[],"published":{"date-parts":[[2017,1,7]]},"assertion":[{"value":"1 April 2016","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 December 2016","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 December 2016","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 January 2017","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}