{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,27]],"date-time":"2026-05-27T18:00:17Z","timestamp":1779904817830,"version":"3.53.1"},"publisher-location":"New York, NY, USA","reference-count":10,"publisher":"ACM","license":[{"start":{"date-parts":[[2017,8,4]],"date-time":"2017-08-04T00:00:00Z","timestamp":1501804800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2017,8,4]]},"DOI":"10.1145\/3097983.3098111","type":"proceedings-article","created":{"date-parts":[[2017,8,4]],"date-time":"2017-08-04T18:35:54Z","timestamp":1501871754000},"page":"1007-1015","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":42,"title":["An Alternative to NCD for Large Sequences, Lempel-Ziv Jaccard Distance"],"prefix":"10.1145","author":[{"given":"Edward","family":"Raff","sequence":"first","affiliation":[{"name":"Laboratory for Physical Sciences, Columbia, MD, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Charles","family":"Nicholas","sequence":"additional","affiliation":[{"name":"University of Maryland, Baltimore County, Baltimore, MD, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2017,8,4]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Detecting Malware with Information Complexity. (2","author":"Alshahwan Nadia","year":"2015","unstructured":"Nadia Alshahwan , Earl T Barr , David Clark , and George Danezis 2015. Detecting Malware with Information Complexity. (2 2015 ). showURL%http:\/\/arxiv.org\/abs\/1502.07661 Nadia Alshahwan, Earl T Barr, David Clark, and George Danezis 2015. Detecting Malware with Information Complexity. (2 2015). showURL%http:\/\/arxiv.org\/abs\/1502.07661"},{"key":"e_1_3_2_1_2_1","volume-title":"Drebin: Effective and Explainable Detection of Android Malware in Your Pocket. Symposium on Network and Distributed System Security (NDSS)","author":"Arp Daniel","year":"2014","unstructured":"Daniel Arp , Michael Spreitzenbarth , Hubner Malte , Hugo Gascon , and Konrad Rieck . 2014 . Drebin: Effective and Explainable Detection of Android Malware in Your Pocket. Symposium on Network and Distributed System Security (NDSS) February (2014), 23--26. https:\/\/doi.org\/10.14722\/ndss.2014.23247 Daniel Arp, Michael Spreitzenbarth, Hubner Malte, Hugo Gascon, and Konrad Rieck. 2014. Drebin: Effective and Explainable Detection of Android Malware in Your Pocket. Symposium on Network and Distributed System Security (NDSS) February (2014), 23--26. https:\/\/doi.org\/10.14722\/ndss.2014.23247"},{"key":"e_1_3_2_1_3_1","volume-title":"Automated Classification and Analysis of Internet Malware Proceedings of the 10th International Conference on Recent Advances in Intrusion Detection (RAID'07)","author":"Bailey Michael","year":"2007","unstructured":"Michael Bailey , Jon Oberheide , Jon Andersen , Z Morley Mao , Farnam Jahanian , and Jose Nazario . 2007 . Automated Classification and Analysis of Internet Malware Proceedings of the 10th International Conference on Recent Advances in Intrusion Detection (RAID'07) . Springer-Verlag, Berlin, Heidelberg, 178--197. http:\/\/dl.acm.org\/citation.cfm?id=1776434.1776449 Michael Bailey, Jon Oberheide, Jon Andersen, Z Morley Mao, Farnam Jahanian, and Jose Nazario. 2007. Automated Classification and Analysis of Internet Malware Proceedings of the 10th International Conference on Recent Advances in Intrusion Detection (RAID'07). Springer-Verlag, Berlin, Heidelberg, 178--197. http:\/\/dl.acm.org\/citation.cfm?id=1776434.1776449"},{"key":"e_1_3_2_1_4_1","volume-title":"On normalized compression distance and large malware. Journal of Computer Virology and Hacking Techniques","author":"Borbely Rebecca Schuller","year":"2015","unstructured":"Rebecca Schuller Borbely . 2015. On normalized compression distance and large malware. Journal of Computer Virology and Hacking Techniques ( 2015 ), 1--8. 1007\/978-3-642-04342-0_7 Rebecca Schuller Borbely. 2015. On normalized compression distance and large malware. Journal of Computer Virology and Hacking Techniques (2015), 1--8. 1007\/978-3-642-04342-0_7"},{"key":"e_1_3_2_1_5_1","volume-title":"Daly (Eds.)","volume":"10","author":"Tran Nicholas","year":"2007","unstructured":"Nicholas Tran . 2007 . The normalized compression distance and image distinguishability Proc. SPIE 6492, Human Vision and Electronic Imaging XII, Bernice E. Rogowitz, Thrasyvoulos N. Pappas, and Scott J . Daly (Eds.) , Vol. Vol. 64921D. https:\/\/doi.org\/ 10 .1117\/12.704334 Nicholas Tran. 2007. The normalized compression distance and image distinguishability Proc. SPIE 6492, Human Vision and Electronic Imaging XII, Bernice E. Rogowitz, Thrasyvoulos N. Pappas, and Scott J. Daly (Eds.), Vol. Vol. 64921D. https:\/\/doi.org\/10.1117\/12.704334"},{"key":"e_1_3_2_1_6_1","article-title":"Analyzing Worms and Network Traffic Using Compression","volume":"15","author":"Wehner Stephanie","year":"2007","unstructured":"Stephanie Wehner . 2007 . Analyzing Worms and Network Traffic Using Compression . J. Comput. Secur. , Vol. 15 , 3 (8 2007), 303--320. ISSN0926-227X http:\/\/dl.acm.org\/citation.cfm?id=1370628.1370630 Stephanie Wehner. 2007. Analyzing Worms and Network Traffic Using Compression. J. Comput. Secur., Vol. 15, 3 (8 2007), 303--320. ISSN0926-227X http:\/\/dl.acm.org\/citation.cfm?id=1370628.1370630","journal-title":"J. Comput. Secur."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11416-006-0028-7"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/MSP.2008.126"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.1977.1055714"},{"key":"e_1_3_2_1_10_1","article-title":"Compression of individual sequences via variable-rate coding","volume":"24","author":"Ziv Jacob","year":"1978","unstructured":"Jacob Ziv and Abraham Lempel 1978 . Compression of individual sequences via variable-rate coding . IEEE Transactions on Information Theory Vol. 24 , 5 (9 1978), 530--536. ISSN0018-9448 https:\/\/doi.org\/10.1109\/TIT.1978.1055934 Jacob Ziv and Abraham Lempel 1978. Compression of individual sequences via variable-rate coding. IEEE Transactions on Information Theory Vol. 24, 5 (9 1978), 530--536. ISSN0018-9448 https:\/\/doi.org\/10.1109\/TIT.1978.1055934","journal-title":"IEEE Transactions on Information Theory"}],"event":{"name":"KDD '17: The 23rd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining","location":"Halifax NS Canada","acronym":"KDD '17","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"]},"container-title":["Proceedings of the 23rd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3097983.3098111","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3097983.3098111","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T03:30:26Z","timestamp":1750217426000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3097983.3098111"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017,8,4]]},"references-count":10,"alternative-id":["10.1145\/3097983.3098111","10.1145\/3097983"],"URL":"https:\/\/doi.org\/10.1145\/3097983.3098111","relation":{},"subject":[],"published":{"date-parts":[[2017,8,4]]},"assertion":[{"value":"2017-08-04","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}