{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,9]],"date-time":"2026-06-09T08:39:49Z","timestamp":1780994389374,"version":"3.54.1"},"publisher-location":"New York, NY, USA","reference-count":51,"publisher":"ACM","funder":[{"name":"NSF &#x28;National Science Foundation&#x29;","award":["2313062"],"award-info":[{"award-number":["2313062"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2026,3,22]]},"DOI":"10.1145\/3779212.3790227","type":"proceedings-article","created":{"date-parts":[[2026,3,10]],"date-time":"2026-03-10T13:55:26Z","timestamp":1773150926000},"page":"1880-1896","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Static Analysis for Efficient Streaming Tokenization"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-4523-3401","authenticated-orcid":false,"given":"Angela W.","family":"Li","sequence":"first","affiliation":[{"name":"Rice University, Houston, Texas, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-3156-0637","authenticated-orcid":false,"given":"Yudi","family":"Yang","sequence":"additional","affiliation":[{"name":"Rice University, Houston, Texas, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1209-7738","authenticated-orcid":false,"given":"Konstantinos","family":"Mamouras","sequence":"additional","affiliation":[{"name":"Rice University, Houston, Texas, USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2026,3,22]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Ullman","author":"Aho Alfred V.","year":"2006","unstructured":"Alfred V. Aho, Monica S. Lam, Ravi Sethi, and Jeffrey D. Ullman. 2006. Compilers: Principles, Techniques and Tools (2nd ed.). Addison Wesley."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","unstructured":"Miguel Angel Garc\u00eda and Gonzalo Camarillo. 2008. Extensible Markup Language (XML) Format Extension for Representing Copy Control Attributes in Resource Lists. RFC 5364. https:\/\/doi.org\/10.17487\/RFC5364","DOI":"10.17487\/RFC5364"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-43144-4_5"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.scico.2015.09.002"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","unstructured":"Tim Bray. 2017. The JavaScript Object Notation (JSON) Data Interchange Format. RFC 8259. https:\/\/doi.org\/10.17487\/RFC8259","DOI":"10.17487\/RFC8259"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1145\/321239.321249"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1145\/176454.176487"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/3703595.3705884"},{"key":"e_1_3_2_1_9_1","volume-title":"Ragel State Machine Compiler. https:\/\/www.colm.net\/open-source\/ragel\/. [Online","author":"Networks Colm","year":"2026","unstructured":"Colm Networks. 2021. Ragel State Machine Compiler. https:\/\/www.colm.net\/open-source\/ragel\/. [Online; accessed January 25, 2026]."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/366663.366704"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-25379-9_11"},{"key":"e_1_3_2_1_12_1","unstructured":"Geoffroy Couprie. 2025. Nom Eating Data Byte by Byte. https:\/\/docs.rs\/nom\/latest\/nom\/"},{"key":"e_1_3_2_1_13_1","volume-title":"Regular Expression Matching in the Wild. https:\/\/swtch.com\/ rsc\/regexp\/regexp3.html. [Online","author":"Cox Russ","year":"2026","unstructured":"Russ Cox. 2010. Regular Expression Matching in the Wild. https:\/\/swtch.com\/ rsc\/regexp\/regexp3.html. [Online; accessed January 25, 2026]."},{"key":"e_1_3_2_1_14_1","unstructured":"Alex Crichton and Andrew Gallant. 2024. regex. https:\/\/crates.io\/crates\/regex"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/SPW53761.2021.00022"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/3497775.3503694"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/3725843.3756052"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/3617232.3624848"},{"key":"e_1_3_2_1_19_1","unstructured":"Google. [n.d.]. GitHub - google\/re2: RE2 is a fast safe thread-friendly alternative to backtracking regular expression engines like those used in PCRE Perl and Python. It is a C library. https:\/\/github.com\/google\/re2"},{"key":"e_1_3_2_1_20_1","unstructured":"Christopher Groskopf and contributors. 2016. csvkit. https:\/\/csvkit.readthedocs.org\/"},{"key":"e_1_3_2_1_21_1","unstructured":"Philip Hazel. 2015. Web Server Access Logs. https:\/\/www.kaggle.com\/datasets\/eliasdabbas\/web-server-access-logs"},{"key":"e_1_3_2_1_22_1","unstructured":"Intenet Assigned Numbers Authority. 1993. Definition of Tab-separated-values (tsv). https:\/\/www.iana.org\/assignments\/media-types\/text\/tab-separated-values"},{"key":"e_1_3_2_1_23_1","volume-title":"Fast Scanner Generator for Java with Full Unicode Support. https:\/\/jflex.de\/. [Online","year":"2024","unstructured":"JFlex. 2024. Fast Scanner Generator for Java with Full Unicode Support. https:\/\/jflex.de\/. [Online; accessed May 22, 2024]."},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/364175.364185"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/3519939.3523456"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3586044"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/3689771"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.14778\/3778092.3778109"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/3720498"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS49936.2021.00079"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1145\/3632934"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/3656461"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","unstructured":"Paul V. Mockapetris. 1987. Domain Names - Implementation and Specification. RFC 1035. https:\/\/doi.org\/10.17487\/RFC1035","DOI":"10.17487\/RFC1035"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1145\/2541940.2541988"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.22152\/programming-journal.org\/2024\/8\/3"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.85.8.2444"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","unstructured":"Roberto Polli Erik Wilde and Eemeli Aro. 2024. YAML Media Type. RFC 9512. https:\/\/doi.org\/10.17487\/RFC9512","DOI":"10.17487\/RFC9512"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/276393.276394"},{"key":"e_1_3_2_1_39_1","volume-title":"A high-performance C regex library and a lexical analyzer generator. https:\/\/www.genivia.com\/doc\/reflex\/html\/. [Online","author":"van Engelen Robert","year":"2024","unstructured":"Robert van Engelen. 2016. RE\/flex: A high-performance C regex library and a lexical analyzer generator. https:\/\/www.genivia.com\/doc\/reflex\/html\/. [Online; accessed May 22, 2024]."},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","unstructured":"Scott Rose Matt Larson Dan Massey Rob Austein and Roy Arends. 2005. Resource Records for the DNS Security Extensions. RFC 4034. https:\/\/doi.org\/10.17487\/RFC4034","DOI":"10.17487\/RFC4034"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0022-0000(70)80006-X"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","unstructured":"Yakov Shafranovich. 2005. Common Format and MIME Type for Comma-Separated Values (CSV) Files. RFC 4180. https:\/\/doi.org\/10.17487\/RFC4180","DOI":"10.17487\/RFC4180"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4302-0244-8_16"},{"key":"e_1_3_2_1_44_1","unstructured":"Geoffry Song. 2024. plex a parser and lexer generator. https:\/\/crates.io\/crates\/plex"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.4230\/LIPIcs.ITP.2023.27"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10817-023-09667-1"},{"key":"e_1_3_2_1_47_1","volume-title":"Flex: The Fast Lexical Analyzer. https:\/\/github.com\/westes\/flex. [Online","author":"Paxson Vern","year":"1987","unstructured":"Vern Paxson. 1987. Flex: The Fast Lexical Analyzer. https:\/\/github.com\/westes\/flex. [Online; accessed May 22, 2024]."},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1145\/3620665.3640412"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/3695053.3731106"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISSRE59848.2023.00071"},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"publisher","DOI":"10.1145\/3636501.3636959"}],"event":{"name":"ASPLOS '26: 31st ACM International Conference on Architectural Support for Programming Languages and Operating Systems","location":"Pittsburgh PA USA","sponsor":["SIGOPS ACM Special Interest Group on Operating Systems","SIGPLAN ACM Special Interest Group on Programming Languages","SIGARCH ACM Special Interest Group on Computer Architecture","SIGBED ACM Special Interest Group on Embedded Systems"]},"container-title":["Proceedings of the 31st ACM International Conference on Architectural Support for Programming Languages and Operating Systems, Volume 2"],"original-title":[],"deposited":{"date-parts":[[2026,3,15]],"date-time":"2026-03-15T14:04:45Z","timestamp":1773583485000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3779212.3790227"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,3,22]]},"references-count":51,"alternative-id":["10.1145\/3779212.3790227","10.1145\/3779212"],"URL":"https:\/\/doi.org\/10.1145\/3779212.3790227","relation":{},"subject":[],"published":{"date-parts":[[2026,3,22]]},"assertion":[{"value":"2026-03-22","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}