{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,5]],"date-time":"2026-01-05T18:13:33Z","timestamp":1767636813933,"version":"3.48.0"},"reference-count":33,"publisher":"Oxford University Press (OUP)","issue":"1","license":[{"start":{"date-parts":[[2025,12,3]],"date-time":"2025-12-03T00:00:00Z","timestamp":1764720000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026,1,2]]},"abstract":"<jats:title>Abstract<\/jats:title>\n                  <jats:sec>\n                    <jats:title>Summary<\/jats:title>\n                    <jats:p>We propose a new algorithm, \u201cinterval hashing,\u201d which distinguishes identical k-mers arising from different repeat sequences, particularly in complex repeat arrays such as alpha satellite HORs. We implement this algorithm as a fork of minimap2, named mm2-ivh. In local assembly of alpha satellite HORs, mm2-ivh accurately reconstructs more haplotypes than assemblers using standard minimizers.<\/jats:p>\n                  <\/jats:sec>\n                  <jats:sec>\n                    <jats:title>Availability and implementation<\/jats:title>\n                    <jats:p>mm2-ivh is available under the MIT license at https:\/\/github.com\/ocxtal\/mm2-ivh and runs on common Unix-compatible systems.<\/jats:p>\n                  <\/jats:sec>","DOI":"10.1093\/bioinformatics\/btaf648","type":"journal-article","created":{"date-parts":[[2025,12,1]],"date-time":"2025-12-01T12:39:01Z","timestamp":1764592741000},"source":"Crossref","is-referenced-by-count":0,"title":["mm2-ivh: simple and precise overlap detection in alpha satellite HORs with interval hashing"],"prefix":"10.1093","volume":"42","author":[{"ORCID":"https:\/\/orcid.org\/0009-0004-0727-6824","authenticated-orcid":false,"given":"Hajime","family":"Suzuki","sequence":"first","affiliation":[{"name":"Division of Genome Analysis Platform Development, National Cancer Center Research Institute , Tokyo 104-0045,","place":["Japan"]}]},{"given":"Masahiro","family":"Sugawa","sequence":"additional","affiliation":[{"name":"Division of Genome Analysis Platform Development, National Cancer Center Research Institute , Tokyo 104-0045,","place":["Japan"]}]},{"given":"Yoshitaka","family":"Sakamoto","sequence":"additional","affiliation":[{"name":"Division of Genome Analysis Platform Development, National Cancer Center Research Institute , Tokyo 104-0045,","place":["Japan"]}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6144-5845","authenticated-orcid":false,"given":"Yuichi","family":"Shiraishi","sequence":"additional","affiliation":[{"name":"Division of Genome Analysis Platform Development, National Cancer Center Research Institute , Tokyo 104-0045,","place":["Japan"]}]}],"member":"286","published-online":{"date-parts":[[2025,12,3]]},"reference":[{"key":"2026010509223903400_btaf648-B1","doi-asserted-by":"crossref","first-page":"2107","DOI":"10.1101\/gr.276871.122","article-title":"Fast and accurate mapping of long reads to complete genome assemblies with VerityMap","volume":"32","author":"Bzikadze","year":"2022","journal-title":"Genome Res"},{"key":"2026010509223903400_btaf648-B2","doi-asserted-by":"crossref","first-page":"1309","DOI":"10.1038\/s41587-020-0582-4","article-title":"Automated assembly of centromeres from ultra-long error-prone reads","volume":"38","author":"Bzikadze","year":"2020","journal-title":"Nat Biotechnol"},{"key":"2026010509223903400_btaf648-B3","doi-asserted-by":"crossref","first-page":"1346","DOI":"10.1038\/s41592-023-01970-4","article-title":"UniAligner: a parameter-free framework for fast sequence alignment","volume":"20","author":"Bzikadze","year":"2023","journal-title":"Nat Methods"},{"key":"2026010509223903400_btaf648-B4","doi-asserted-by":"crossref","first-page":"863","DOI":"10.1101\/gr.279308.124","article-title":"RAmbler resolves complex repeats in human chromosomes 8, 19, and X","volume":"35","author":"Chakravarty","year":"2025","journal-title":"Genome Res"},{"key":"2026010509223903400_btaf648-B5","doi-asserted-by":"crossref","first-page":"170","DOI":"10.1038\/s41592-020-01056-5","article-title":"Haplotype-resolved de novo assembly using phased assembly graphs with hifiasm","volume":"18","author":"Cheng","year":"2021","journal-title":"Nat Methods"},{"key":"2026010509223903400_btaf648-B6","doi-asserted-by":"crossref","first-page":"btac714","DOI":"10.1093\/bioinformatics\/btac714","article-title":"GAVISUNK: genome assembly validation via inter-SUNK distances in oxford nanopore reads","volume":"39","author":"Dishuck","year":"2023","journal-title":"Bioinformatics"},{"key":"2026010509223903400_btaf648-B7","doi-asserted-by":"crossref","first-page":"i93","DOI":"10.1093\/bioinformatics\/btaa454","article-title":"The string decomposition problem and its applications to centromere analysis and assembly","volume":"36","author":"Dvorkina","year":"2020","journal-title":"Bioinformatics"},{"key":"2026010509223903400_btaf648-B8","doi-asserted-by":"crossref","first-page":"110842","DOI":"10.1016\/j.ygeno.2024.110842","article-title":"Advancements in long-read genome sequencing technologies and algorithms","volume":"116","author":"Espinosa","year":"2024","journal-title":"Genomics"},{"key":"2026010509223903400_btaf648-B9","doi-asserted-by":"crossref","first-page":"i297","DOI":"10.1093\/bioinformatics\/btad272","article-title":"RawHash: enabling fast and accurate real-time analysis of raw nanopore signals for large genomes","volume":"39","author":"Firtina","year":"2023","journal-title":"Bioinformatics"},{"key":"2026010509223903400_btaf648-B10","doi-asserted-by":"crossref","first-page":"705","DOI":"10.1038\/s41592-022-01457-8","article-title":"Long-read mapping to repetitive reference sequences using Winnowmap2","volume":"19","author":"Jain","year":"2022","journal-title":"Nat Methods"},{"key":"2026010509223903400_btaf648-B11","doi-asserted-by":"crossref","first-page":"338","DOI":"10.1038\/nbt.4060","article-title":"Nanopore sequencing and assembly of a human genome with ultra-long reads","volume":"36","author":"Jain","year":"2018","journal-title":"Nat Biotechnol"},{"key":"2026010509223903400_btaf648-B12","doi-asserted-by":"crossref","first-page":"311","DOI":"10.1093\/bioinformatics\/btw620","article-title":"OMBlast: alignment tool for optical mapping using a seed-and-extend approach","volume":"33","author":"Leung","year":"2017","journal-title":"Bioinformatics"},{"key":"2026010509223903400_btaf648-B13","doi-asserted-by":"crossref","first-page":"2103","DOI":"10.1093\/bioinformatics\/btw152","article-title":"Minimap and miniasm: fast mapping and de novo assembly for noisy long sequences","volume":"32","author":"Li","year":"2016","journal-title":"Bioinformatics"},{"key":"2026010509223903400_btaf648-B14","doi-asserted-by":"crossref","first-page":"3094","DOI":"10.1093\/bioinformatics\/bty191","article-title":"Minimap2: pairwise alignment for nucleotide sequences","volume":"34","author":"Li","year":"2018","journal-title":"Bioinformatics"},{"key":"2026010509223903400_btaf648-B15","doi-asserted-by":"crossref","first-page":"430","DOI":"10.1038\/s41586-025-09140-6","article-title":"Complex genetic variation in nearly complete human genomes","volume":"644","author":"Logsdon","year":"2025","journal-title":"Nature"},{"key":"2026010509223903400_btaf648-B16","doi-asserted-by":"crossref","first-page":"92","DOI":"10.3390\/genes14010092","article-title":"The dynamic structure and rapid evolution of human centromeric satellite DNA","volume":"14","author":"Logsdon","year":"2022","journal-title":"Genes (Basel)"},{"key":"2026010509223903400_btaf648-B17","doi-asserted-by":"crossref","first-page":"136","DOI":"10.1038\/s41586-024-07278-3","article-title":"The variation and evolution of complete human centromeres","volume":"629","author":"Logsdon","year":"2024","journal-title":"Nature"},{"key":"2026010509223903400_btaf648-B18","doi-asserted-by":"crossref","first-page":"101","DOI":"10.1038\/s41586-021-03420-7","article-title":"The structure, function and evolution of a complete human chromosome 8","volume":"593","author":"Logsdon","year":"2021","journal-title":"Nature"},{"key":"2026010509223903400_btaf648-B19","doi-asserted-by":"crossref","first-page":"440","DOI":"10.1093\/bioinformatics\/18.3.440","article-title":"PatternHunter: faster and more sensitive homology search","volume":"18","author":"Ma","year":"2002","journal-title":"Bioinformatics"},{"key":"2026010509223903400_btaf648-B20","doi-asserted-by":"crossref","first-page":"79","DOI":"10.1038\/s41586-020-2547-7","article-title":"Telomere-to-telomere assembly of a complete human X chromosome","volume":"585","author":"Miga","year":"2020","journal-title":"Nature"},{"key":"2026010509223903400_btaf648-B21","doi-asserted-by":"crossref","first-page":"3492","DOI":"10.1093\/bioinformatics\/btw397","article-title":"ntHash: recursive nucleotide hashing","volume":"32","author":"Mohamadi","year":"2016","journal-title":"Bioinformatics"},{"key":"2026010509223903400_btaf648-B22","doi-asserted-by":"crossref","first-page":"44","DOI":"10.1126\/science.abj6987","article-title":"The complete sequence of a human genome","volume":"376","author":"Nurk","year":"2022","journal-title":"Science"},{"key":"2026010509223903400_btaf648-B23","doi-asserted-by":"crossref","first-page":"1474","DOI":"10.1038\/s41587-023-01662-6","article-title":"Telomere-to-telomere assembly of diploid chromosomes with Verkko","volume":"41","author":"Rautiainen","year":"2023","journal-title":"Nat Biotechnol"},{"key":"2026010509223903400_btaf648-B24","doi-asserted-by":"crossref","first-page":"3363","DOI":"10.1093\/bioinformatics\/bth408","article-title":"Reducing storage requirements for biological sequence comparison","volume":"20","author":"Roberts","year":"2004","journal-title":"Bioinformatics"},{"key":"2026010509223903400_btaf648-B25","doi-asserted-by":"crossref","first-page":"2080","DOI":"10.1101\/gr.275648.121","article-title":"Effective sequence similarity detection with strobemers","volume":"31","author":"Sahlin","year":"2021","journal-title":"Genome Res"},{"key":"2026010509223903400_btaf648-B26","doi-asserted-by":"crossref","first-page":"682","DOI":"10.1093\/bioinformatics\/btz663","article-title":"Fast and accurate correction of optical mapping data via spaced seeds","volume":"36","author":"Salmela","year":"2020","journal-title":"Bioinformatics"},{"year":"2024","author":"Stanojevic","key":"2026010509223903400_btaf648-B27","doi-asserted-by":"publisher","DOI":"10.1101\/2024.05.18.594796"},{"key":"2026010509223903400_btaf648-B28","doi-asserted-by":"crossref","first-page":"4309","DOI":"10.3390\/ijms22094309","article-title":"Sequence, chromatin and evolution of satellite DNA","volume":"22","author":"Thakur","year":"2021","journal-title":"IJMS"},{"key":"2026010509223903400_btaf648-B29","doi-asserted-by":"crossref","first-page":"1155","DOI":"10.1038\/s41587-019-0217-9","article-title":"Accurate circular consensus long-read sequencing improves variant detection and assembly of a human genome","volume":"37","author":"Wenger","year":"2019","journal-title":"Nat Biotechnol"},{"key":"2026010509223903400_btaf648-B30","doi-asserted-by":"crossref","first-page":"192","DOI":"10.1016\/0168-9525(87)90232-0","article-title":"Hierarchical order in chromosome-specific human alpha satellite DNA","volume":"3","author":"Willard","year":"1987","journal-title":"Trends Genet"},{"key":"2026010509223903400_btaf648-B31","doi-asserted-by":"crossref","first-page":"363","DOI":"10.1016\/0022-2836(80)90277-6","article-title":"Sequence definition and organization of a human repeated DNA","volume":"142","author":"Wu","year":"1980","journal-title":"J Mol Biol"},{"key":"2026010509223903400_btaf648-B32","doi-asserted-by":"crossref","first-page":"745","DOI":"10.1038\/s41422-023-00849-5","article-title":"The complete and fully-phased diploid genome of a male Han Chinese","volume":"33","author":"Yang","year":"2023","journal-title":"Cell Res"},{"key":"2026010509223903400_btaf648-B33","doi-asserted-by":"crossref","first-page":"1209","DOI":"10.1101\/gr.279763.124","article-title":"Fast sequence alignment for centromeres with RaMA","volume":"35","author":"Zhang","year":"2025","journal-title":"Genome Res"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/advance-article-pdf\/doi\/10.1093\/bioinformatics\/btaf648\/65728363\/btaf648.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/42\/1\/btaf648\/65728363\/btaf648.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/42\/1\/btaf648\/65728363\/btaf648.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,5]],"date-time":"2026-01-05T14:22:52Z","timestamp":1767622972000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/doi\/10.1093\/bioinformatics\/btaf648\/8363875"}},"subtitle":[],"editor":[{"given":"Can","family":"Alkan","sequence":"additional","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2025,12,3]]},"references-count":33,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,1,2]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/btaf648","relation":{},"ISSN":["1367-4803","1367-4811"],"issn-type":[{"type":"print","value":"1367-4803"},{"type":"electronic","value":"1367-4811"}],"subject":[],"published-other":{"date-parts":[[2026,1]]},"published":{"date-parts":[[2025,12,3]]},"article-number":"btaf648"}}