{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T11:51:25Z","timestamp":1773229885894,"version":"3.50.1"},"reference-count":24,"publisher":"Oxford University Press (OUP)","issue":"8","license":[{"start":{"date-parts":[[2024,7,30]],"date-time":"2024-07-30T00:00:00Z","timestamp":1722297600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/100000028","name":"Semiconductor Research Corporation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000028","id-type":"DOI","asserted-by":"publisher"}]},{"name":"European Union\u2019s Horizon Programme for Research and Innovation"},{"DOI":"10.13039\/501100001711","name":"Swiss National Science Foundation","doi-asserted-by":"publisher","award":["200021_213084"],"award-info":[{"award-number":["200021_213084"]}],"id":[{"id":"10.13039\/501100001711","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,8,2]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:sec>\n                  <jats:title>Summary<\/jats:title>\n                  <jats:p>Raw nanopore signals can be analyzed while they are being generated, a process known as real-time analysis. Real-time analysis of raw signals is essential to utilize the unique features that nanopore sequencing provides, enabling the early stopping of the sequencing of a read or the entire sequencing run based on the analysis. The state-of-the-art mechanism, RawHash, offers the first hash-based efficient and accurate similarity identification between raw signals and a reference genome by quickly matching their hash values. In this work, we introduce RawHash2, which provides major improvements over RawHash, including more sensitive quantization and chaining algorithms, weighted mapping decisions, frequency filters to reduce ambiguous seed hits, minimizers for hash-based sketching, and support for the R10.4 flow cell version and POD5 and SLOW5 file formats. Compared to RawHash, RawHash2 provides better F1 accuracy (on average by 10.57% and up to 20.25%) and better throughput (on average by 4.0\u00d7 and up to 9.9\u00d7) than RawHash.<\/jats:p>\n               <\/jats:sec>\n               <jats:sec>\n                  <jats:title>Availability and implementation<\/jats:title>\n                  <jats:p>RawHash2 is available at https:\/\/github.com\/CMU-SAFARI\/RawHash. We also provide the scripts to fully reproduce our results on our GitHub page.<\/jats:p>\n               <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btae478","type":"journal-article","created":{"date-parts":[[2024,7,30]],"date-time":"2024-07-30T19:49:06Z","timestamp":1722368946000},"source":"Crossref","is-referenced-by-count":15,"title":["RawHash2: mapping raw nanopore signals using hash-based seeding and adaptive quantization"],"prefix":"10.1093","volume":"40","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-6548-7863","authenticated-orcid":false,"given":"Can","family":"Firtina","sequence":"first","affiliation":[{"name":"Department of Information Technology and Electrical Engineering, ETH Zurich , Zurich 8092, Switzerland"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-2378-6737","authenticated-orcid":false,"given":"Melina","family":"Soysal","sequence":"additional","affiliation":[{"name":"Department of Information Technology and Electrical Engineering, ETH Zurich , Zurich 8092, Switzerland"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2581-8637","authenticated-orcid":false,"given":"Jo\u00ebl","family":"Lindegger","sequence":"additional","affiliation":[{"name":"Department of Information Technology and Electrical Engineering, ETH Zurich , Zurich 8092, Switzerland"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0075-2312","authenticated-orcid":false,"given":"Onur","family":"Mutlu","sequence":"additional","affiliation":[{"name":"Department of Information Technology and Electrical Engineering, ETH Zurich , Zurich 8092, Switzerland"}]}],"member":"286","published-online":{"date-parts":[[2024,7,30]]},"reference":[{"key":"2024082005161958700_btae478-B1","doi-asserted-by":"crossref","first-page":"403","DOI":"10.1016\/S0022-2836(05)80360-2","article-title":"Basic local alignment search tool","volume":"215","author":"Altschul","year":"1990","journal-title":"J Mol Biol"},{"key":"2024082005161958700_btae478-B2","doi-asserted-by":"crossref","first-page":"298","DOI":"10.1186\/s13059-021-02511-y","article-title":"SquiggleNet: real-time, direct classification of nanopore signals","volume":"22","author":"Bao","year":"2021","journal-title":"Genome Biol"},{"key":"2024082005161958700_btae478-B3","first-page":"535","article-title":"SquiggleFilter: an accelerator for portable virus detection","author":"Dunn","year":"2021","journal-title":"MICRO, New York, NY, USA,"},{"key":"2024082005161958700_btae478-B4","doi-asserted-by":"crossref","first-page":"17504","DOI":"10.1038\/s41598-019-53739-5","article-title":"Real-Time selective sequencing with RUBRIC: read until with basecall and reference-informed criteria","volume":"9","author":"Edwards","year":"2019","journal-title":"Sci Rep"},{"key":"2024082005161958700_btae478-B5","doi-asserted-by":"crossref","first-page":"i297","DOI":"10.1093\/bioinformatics\/btad272","article-title":"RawHash: enabling fast and accurate real-time analysis of raw nanopore signals for large genomes","volume":"39(Supplement_1)","author":"Firtina","year":"2023","journal-title":"Bioinformatics"},{"key":"2024082005161958700_btae478-B6","doi-asserted-by":"crossref","DOI":"10.1093\/nargab\/lqad004","article-title":"BLEND: a fast, memory-efficient and accurate mechanism to find fuzzy seed matches in genome analysis","author":"Firtina","year":"2023","journal-title":"NAR Genomics and Bioinformatics"},{"key":"2024082005161958700_btae478-B7","doi-asserted-by":"crossref","first-page":"1026","DOI":"10.1038\/s41587-021-01147-4","article-title":"Fast nanopore sequencing data analysis with SLOW5","volume":"40","author":"Gamaarachchi","year":"2022","journal-title":"Nat Biotechnol"},{"key":"2024082005161958700_btae478-B8","doi-asserted-by":"crossref","first-page":"338","DOI":"10.1038\/nbt.4060","article-title":"Nanopore sequencing and assembly of a human genome with ultra-long reads","volume":"36","author":"Jain","year":"2018","journal-title":"Nat Biotechnol"},{"key":"2024082005161958700_btae478-B9","doi-asserted-by":"crossref","first-page":"431","DOI":"10.1038\/s41587-020-0731-9","article-title":"Targeted nanopore sequencing by real-time mapping of raw electrical signal with UNCALLED","volume":"39","author":"Kovaka","year":"2021","journal-title":"Nat Biotechnol"},{"key":"2024082005161958700_btae478-B10","author":"Kovaka","year":"2024"},{"key":"2024082005161958700_btae478-B11","doi-asserted-by":"crossref","first-page":"3094","DOI":"10.1093\/bioinformatics\/bty191","article-title":"Minimap2: pairwise alignment for nucleotide sequences","volume":"34","author":"Li","year":"2018","journal-title":"Bioinformatics"},{"key":"2024082005161958700_btae478-B12","author":"Lindegger","year":"2023"},{"key":"2024082005161958700_btae478-B13","doi-asserted-by":"crossref","first-page":"751","DOI":"10.1038\/nmeth.3930","article-title":"Real-time selective sequencing using nanopore technology","volume":"13","author":"Loose","year":"2016","journal-title":"Nat Methods"},{"key":"2024082005161958700_btae478-B14","doi-asserted-by":"crossref","first-page":"i66","DOI":"10.1093\/bioinformatics\/btad243","article-title":"Coriolis: enabling metagenomic classification on lightweight mobile devices","volume":"39(Supplement_1)","author":"Mikalsen","year":"2023","journal-title":"Bioinformatics"},{"key":"2024082005161958700_btae478-B15","doi-asserted-by":"crossref","first-page":"442","DOI":"10.1038\/s41587-020-00746-x","article-title":"Readfish enables targeted nanopore sequencing of gigabase-sized genomes","volume":"39","author":"Payne","year":"2021","journal-title":"Nat Biotechnol"},{"key":"2024082005161958700_btae478-B16","doi-asserted-by":"crossref","first-page":"3363","DOI":"10.1093\/bioinformatics\/bth408","article-title":"Reducing storage requirements for biological sequence comparison","volume":"20","author":"Roberts","year":"2004","journal-title":"Bioinformatics"},{"key":"2024082005161958700_btae478-B17","doi-asserted-by":"crossref","first-page":"45","DOI":"10.26502\/acbr.50170318","article-title":"Rapid real-time squiggle classification for read until using RawMap","volume":"7","author":"Sadasivan","year":"2023","journal-title":"Arch Clin Biomed Res"},{"key":"2024082005161958700_btae478-B18","doi-asserted-by":"crossref","first-page":"2080","DOI":"10.1101\/gr.275648.121","article-title":"Effective sequence similarity detection with strobemers","volume":"31","author":"Sahlin","year":"2021","journal-title":"Genome Res"},{"key":"2024082005161958700_btae478-B19","doi-asserted-by":"crossref","first-page":"31","DOI":"10.1186\/s12859-023-05151-0","article-title":"DeepSelectNet: deep neural network based selective sequencing for oxford nanopore sequencing","volume":"24","author":"Senanayake","year":"2023","journal-title":"BMC Bioinform"},{"key":"2024082005161958700_btae478-B20","doi-asserted-by":"crossref","first-page":"1542","DOI":"10.1093\/bib\/bby017","article-title":"Nanopore sequencing technology and tools for genome assembly: computational analysis of the current state, bottlenecks and future directions","volume":"20","author":"Senol Cali","year":"2019","journal-title":"Brief Bioinform"},{"key":"2024082005161958700_btae478-B21","doi-asserted-by":"crossref","first-page":"giad046","DOI":"10.1093\/gigascience\/giad046","article-title":"Efficient real-time selective genome sequencing on resource-constrained devices","volume":"12","author":"Shih","year":"2023","journal-title":"Gigascience"},{"key":"2024082005161958700_btae478-B22","doi-asserted-by":"crossref","first-page":"i287","DOI":"10.1093\/bioinformatics\/btae213","article-title":"Sigmoni: classification of nanopore signal with a compressed pangenome index","volume":"40(Supplement_1)","author":"Shivakumar","year":"2024","journal-title":"Bioinformatics"},{"key":"2024082005161958700_btae478-B23","doi-asserted-by":"crossref","first-page":"i153","DOI":"10.1093\/bioinformatics\/btac223","article-title":"ReadBouncer: precise and scalable adaptive sampling for nanopore sequencing","volume":"38(Supplement_1)","author":"Ulrich","year":"2022","journal-title":"Bioinformatics"},{"key":"2024082005161958700_btae478-B24","doi-asserted-by":"crossref","DOI":"10.1093\/bioinformatics\/btab264","article-title":"Real-time mapping of nanopore raw signals","author":"Zhang","year":"2021","journal-title":"Bioinformatics"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/advance-article-pdf\/doi\/10.1093\/bioinformatics\/btae478\/58689561\/btae478.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/40\/8\/btae478\/58856590\/btae478.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/40\/8\/btae478\/58856590\/btae478.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,8,20]],"date-time":"2024-08-20T05:17:08Z","timestamp":1724131028000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/doi\/10.1093\/bioinformatics\/btae478\/7723993"}},"subtitle":[],"editor":[{"given":"Inanc","family":"Birol","sequence":"additional","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2024,7,30]]},"references-count":24,"journal-issue":{"issue":"8","published-print":{"date-parts":[[2024,8,2]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btae478","relation":{},"ISSN":["1367-4811"],"issn-type":[{"value":"1367-4811","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2024,8]]},"published":{"date-parts":[[2024,7,30]]},"article-number":"btae478"}}