{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,24]],"date-time":"2026-03-24T15:26:41Z","timestamp":1774366001425,"version":"3.50.1"},"publisher-location":"Cham","reference-count":31,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031708893","type":"print"},{"value":"9783031708909","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024]]},"DOI":"10.1007\/978-3-031-70890-9_8","type":"book-chapter","created":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T09:24:24Z","timestamp":1725528264000},"page":"144-161","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["CRATOR a\u00a0CRAwler for\u00a0TOR: Turning Dark Web Pages into Open Source INTelligence"],"prefix":"10.1007","author":[{"given":"Daniel","family":"De Pascale","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Giuseppe","family":"Cascavilla","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Damian A.","family":"Tamburri","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Willem Jan","family":"Van Den Heuvel","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,9,6]]},"reference":[{"key":"8_CR1","unstructured":"Santos, A., Pham, K.: Ache focused crawler (2023). https:\/\/github.com\/VIDA-NYU\/ache"},{"key":"8_CR2","doi-asserted-by":"crossref","unstructured":"Barbosa, L., Freire, J.: An adaptive crawler for locating hidden-web entry points. In: Proceedings of the 16th international conference on World Wide Web, pp. 441\u2013450 (2007)","DOI":"10.1145\/1242572.1242632"},{"key":"8_CR3","doi-asserted-by":"publisher","first-page":"35914","DOI":"10.1109\/ACCESS.2023.3255165","volume":"11","author":"J Bergman","year":"2023","unstructured":"Bergman, J., Popov, O.B.: Exploring dark web crawlers: a systematic literature review of dark web crawlers and their implementation. IEEE Access 11, 35914\u201335933 (2023)","journal-title":"IEEE Access"},{"issue":"2","key":"8_CR4","doi-asserted-by":"publisher","first-page":"23","DOI":"10.5121\/ijdkp.2013.3202","volume":"3","author":"K Bharati","year":"2013","unstructured":"Bharati, K., Premchand, P., Govardhan, A.: HIGWGET-a model for crawling secure hidden webpages. Int. J. Data Min. Knowl. Manage. Process 3(2), 23 (2013)","journal-title":"Int. J. Data Min. Knowl. Manage. Process"},{"issue":"2","key":"8_CR5","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3160017","volume":"12","author":"P Boldi","year":"2018","unstructured":"Boldi, P., Marino, A., Santini, M., Vigna, S.: BUbiNG: massive crawling for the masses. ACM Trans. Web (TWEB) 12(2), 1\u201326 (2018)","journal-title":"ACM Trans. Web (TWEB)"},{"key":"8_CR6","doi-asserted-by":"crossref","unstructured":"Boshmaf, Y., Perera, I., Kumarasinghe, U., Liyanage, S., Al\u00a0Jawaheri, H.: Dizzy: large-scale crawling and analysis of onion services. In: Proceedings of the 18th International Conference on Availability, Reliability and Security, pp. 1\u201311 (2023)","DOI":"10.1145\/3600160.3600167"},{"key":"8_CR7","doi-asserted-by":"publisher","unstructured":"Cascavilla, G.: The rise of cybercrime and cyber-threat intelligence: perspectives and challenges from law enforcement. IEEE Secur. Priv. (01), 2\u201311 (2024). https:\/\/doi.org\/10.1109\/MSEC.2024.3407859","DOI":"10.1109\/MSEC.2024.3407859"},{"key":"8_CR8","doi-asserted-by":"publisher","DOI":"10.1016\/j.cose.2021.102258","volume":"105","author":"G Cascavilla","year":"2021","unstructured":"Cascavilla, G., Tamburri, D.A., Van Den Heuvel, W.J.: Cybercrime threat intelligence: a systematic multi-vocal literature review. Comput. Secur. 105, 102258 (2021)","journal-title":"Comput. Secur."},{"key":"8_CR9","doi-asserted-by":"crossref","unstructured":"Celestini, A., Guarino, S.: Design, implementation and test of a flexible tor-oriented web mining toolkit. In: Proceedings of the 7th International Conference on Web Intelligence, Mining and Semantics, pp. 1\u201310 (2017)","DOI":"10.1145\/3102254.3102266"},{"key":"8_CR10","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/978-3-642-29892-9_1","volume-title":"Formal Concept Analysis","author":"H Chen","year":"2012","unstructured":"Chen, H.: Dark web: exploring and mining the dark side of the web. In: Domenach, F., Ignatov, D.I., Poelmans, J. (eds.) ICFCA 2012. LNCS (LNAI), vol. 7278, pp. 1\u20131. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-29892-9_1"},{"issue":"1\u20137","key":"8_CR11","doi-asserted-by":"publisher","first-page":"161","DOI":"10.1016\/S0169-7552(98)00108-1","volume":"30","author":"J Cho","year":"1998","unstructured":"Cho, J., Garcia-Molina, H., Page, L.: Efficient crawling through URL ordering. Comput. Netw. ISDN Syst. 30(1\u20137), 161\u2013172 (1998)","journal-title":"Comput. Netw. ISDN Syst."},{"key":"8_CR12","doi-asserted-by":"publisher","unstructured":"De\u00a0Pascale, D., Cascavilla, G., Tamburri, D.A., Van Den\u00a0Heuvel, W.J.: SENSEI: scraper for enhanced analysis to evaluate illicit trends. In: Troya, J., et al. (eds.) International Conference on Service-Oriented Computing, pp. 374\u2013383. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-26507-5_36","DOI":"10.1007\/978-3-031-26507-5_36"},{"key":"8_CR13","doi-asserted-by":"publisher","unstructured":"Dhabliya, D., Alawadi, A.H., Rai, V.K., Velusudha, N., Sarathy, K.: Evaluation of focused web crawlers in real-world scenarios. In: 2023 3rd International Conference on Technological Advancements in Computational Sciences (ICTACS), pp. 711\u2013715 (2023). https:\/\/doi.org\/10.1109\/ICTACS59847.2023.10389832","DOI":"10.1109\/ICTACS59847.2023.10389832"},{"issue":"8","key":"8_CR14","doi-asserted-by":"publisher","first-page":"880","DOI":"10.1016\/j.comcom.2005.01.003","volume":"28","author":"MD Dikaiakos","year":"2005","unstructured":"Dikaiakos, M.D., Stassopoulou, A., Papageorgiou, L.: An investigation of web crawler behavior: characterization and metrics. Comput. Commun. 28(8), 880\u2013897 (2005)","journal-title":"Comput. Commun."},{"key":"8_CR15","doi-asserted-by":"publisher","unstructured":"Dinh, N.T., Hoang, V.T.: Recent advances of captcha security analysis: a short literature review. Procedia Comput. Sci. 218, 2550\u20132562 (2023). https:\/\/doi.org\/10.1016\/j.procs.2023.01.229, International Conference on Machine Learning and Data Engineering","DOI":"10.1016\/j.procs.2023.01.229"},{"key":"8_CR16","series-title":"Studies in Computational Intelligence","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1007\/978-981-16-6597-4_3","volume-title":"Cyber Security: Issues and Current Trends","author":"N Dutta","year":"2022","unstructured":"Dutta, N., Jadav, N., Tanwar, S., Sarma, H.K.D., Pricop, E.: TOR\u2014the onion router. In: Cyber Security: Issues and Current Trends. SCI, vol. 995, pp. 37\u201355. Springer, Singapore (2022). https:\/\/doi.org\/10.1007\/978-981-16-6597-4_3"},{"key":"8_CR17","doi-asserted-by":"crossref","unstructured":"Girardi, C., Ricca, F., Tonella, P.: Web crawlers compared. Int. J. Web Inf. Syst. 285\u201394 (2006)","DOI":"10.1108\/17440080680000104"},{"key":"8_CR18","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"137","DOI":"10.1007\/3-540-61996-8_37","volume-title":"Information Hiding","author":"DM Goldschlag","year":"1996","unstructured":"Goldschlag, D.M., Reed, M.G., Syverson, P.F.: Hiding routing information. In: Anderson, R. (ed.) IH 1996. LNCS, vol. 1174, pp. 137\u2013150. Springer, Heidelberg (1996). https:\/\/doi.org\/10.1007\/3-540-61996-8_37"},{"key":"8_CR19","unstructured":"Greenberg, A.: Hacker lexicon: what is the dark web? Wired. http:\/\/www.wired.com\/2014\/11\/hacker-lexicon-whats-dark-web [dostkep 6.02. 2017] (2014)"},{"key":"8_CR20","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"221","DOI":"10.1007\/978-3-319-39381-0_20","volume-title":"Human Aspects of Information Security, Privacy, and Trust","author":"G Kalpakis","year":"2016","unstructured":"Kalpakis, G., et al.: Interactive discovery and retrieval of web resources containing home made explosive recipes. In: Tryfonas, T. (ed.) HAS 2016. LNCS, vol. 9750, pp. 221\u2013233. Springer, Cham (2016). https:\/\/doi.org\/10.1007\/978-3-319-39381-0_20"},{"key":"8_CR21","first-page":"32","volume":"1","author":"R Khare","year":"2004","unstructured":"Khare, R., Cutting, D., Sitaker, K., Rifkin, A.: Nutch: a flexible and scalable open-source web search engine. Oregon State Univ. 1, 32\u201332 (2004)","journal-title":"Oregon State Univ."},{"issue":"2","key":"8_CR22","doi-asserted-by":"publisher","first-page":"1107","DOI":"10.1007\/s11831-021-09608-4","volume":"29","author":"M Kumar","year":"2022","unstructured":"Kumar, M., Jindal, M.K., Kumar, M.: A systematic survey on CAPTCHA recognition: types, creation and breaking techniques. Arch. Comput. Methods Eng. 29(2), 1107\u20131136 (2022)","journal-title":"Arch. Comput. Methods Eng."},{"key":"8_CR23","doi-asserted-by":"publisher","unstructured":"Liu, B., Liu, B., Menczer, F.: Web crawling. In: Web Data Mining: Exploring Hyperlinks, Contents, and Usage Data, pp. 311\u2013362 (2011). https:\/\/doi.org\/10.1007\/978-3-642-19460-3","DOI":"10.1007\/978-3-642-19460-3"},{"key":"8_CR24","unstructured":"Moshe, N., Brizinov, S., Onitza-Klugman, R., Efimov, K.: Exploiting URL parsers: The good, bad, and inconsistent. Tech. rep., Technical report. 2021 (2022). https:\/\/security.claroty.com\/URLparserconfusion"},{"key":"8_CR25","series-title":"Lecture Notes in Networks and Systems","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1007\/978-981-15-0146-3_19","volume-title":"Inventive Communication and Computational Technologies","author":"PS Narayanan","year":"2020","unstructured":"Narayanan, P.S., Ani, R., King, A.T.L.: TorBot: open source intelligence tool for Dark Web. In: Ranganathan, G., Chen, J., Rocha, \u00c1. (eds.) Inventive Communication and Computational Technologies. LNNS, vol. 89, pp. 187\u2013195. Springer, Singapore (2020). https:\/\/doi.org\/10.1007\/978-981-15-0146-3_19"},{"issue":"2","key":"8_CR26","doi-asserted-by":"publisher","first-page":"160","DOI":"10.1177\/10439862231159774","volume":"39","author":"FT Ngo","year":"2023","unstructured":"Ngo, F.T., Marcum, C., Belshaw, S.: The Dark web: what is it, how to access it, and why we need to study it. J. Contemp. Crim. Justice 39(2), 160\u2013166 (2023). https:\/\/doi.org\/10.1177\/10439862231159774","journal-title":"J. Contemp. Crim. Justice"},{"key":"8_CR27","doi-asserted-by":"publisher","first-page":"153","DOI":"10.1007\/978-3-662-10874-1_7","volume":"2004","author":"G Pant","year":"2004","unstructured":"Pant, G., Srinivasan, P., Menczer, F.: Crawling the web. Web Dyn. 2004, 153\u2013178 (2004)","journal-title":"Web Dyn."},{"key":"8_CR28","doi-asserted-by":"publisher","unstructured":"Prabha, C., Mittal, A.: Dark web: a review on the deeper side of the web. In: 2022 OPJU International Technology Conference on Emerging Technologies for Sustainable Development (OTCON), pp.\u00a01\u20136 (2023). https:\/\/doi.org\/10.1109\/OTCON56053.2023.10113989","DOI":"10.1109\/OTCON56053.2023.10113989"},{"issue":"11","key":"8_CR29","doi-asserted-by":"publisher","DOI":"10.1016\/j.heliyon.2023.e22269","volume":"9","author":"R Raman","year":"2023","unstructured":"Raman, R., Kumar Nair, V., Nedungadi, P., Ray, I., Achuthan, K.: Darkweb research: past, present, and future trends and mapping to sustainable development goals. Heliyon 9(11), e22269 (2023)","journal-title":"Heliyon"},{"key":"8_CR30","doi-asserted-by":"publisher","unstructured":"Ristoski, P.: Web mining. In: Rokach, L., Maimon, O., Shmueli, E. (eds.) Machine Learning for Data Science Handbook, pp. 447\u2013467. Springer, Cham (2023). https:\/\/doi.org\/10.1007\/978-3-031-24628-9_20","DOI":"10.1007\/978-3-031-24628-9_20"},{"key":"8_CR31","doi-asserted-by":"publisher","unstructured":"Yang, D., Thiengburanathum, P.: Scalability and robustness testing for open source web crawlers. In: 2021 Joint International Conference on Digital Arts, Media and Technology with ECTI Northern Section Conference on Electrical, Electronics, Computer and Telecommunication Engineering, pp. 197\u2013201 (2021). https:\/\/doi.org\/10.1109\/ECTIDAMTNCON51128.2021.9425701","DOI":"10.1109\/ECTIDAMTNCON51128.2021.9425701"}],"container-title":["Lecture Notes in Computer Science","Computer Security \u2013 ESORICS 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-70890-9_8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T09:26:48Z","timestamp":1725528408000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-70890-9_8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"ISBN":["9783031708893","9783031708909"],"references-count":31,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-70890-9_8","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"6 September 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ESORICS","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Symposium on Research in Computer Security","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Bydgoszcz","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Poland","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"16 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20 September 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"esorics2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/esorics2024.org","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}