{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,5]],"date-time":"2026-03-05T15:34:17Z","timestamp":1772724857137,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":58,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,6,21]]},"DOI":"10.1145\/3695053.3731056","type":"proceedings-article","created":{"date-parts":[[2025,6,20]],"date-time":"2025-06-20T16:46:17Z","timestamp":1750437977000},"page":"1834-1847","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["NMP-PaK: Near-Memory Processing Acceleration of Scalable De Novo Genome Assembly"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6748-2890","authenticated-orcid":false,"given":"Heewoo","family":"Kim","sequence":"first","affiliation":[{"name":"University of Colorado, Boulder, CO, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8688-1843","authenticated-orcid":false,"given":"Sanjay Sri Vallabh","family":"Singapuram","sequence":"additional","affiliation":[{"name":"University of Michigan, Ann Arbor, MI, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5360-5159","authenticated-orcid":false,"given":"Haojie","family":"Ye","sequence":"additional","affiliation":[{"name":"University of Michigan, Ann Arbor, MI, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-1267-5024","authenticated-orcid":false,"given":"Joseph","family":"Izraelevitz","sequence":"additional","affiliation":[{"name":"University of Colorado, Boulder, CO, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7845-2187","authenticated-orcid":false,"given":"Trevor","family":"Mudge","sequence":"additional","affiliation":[{"name":"University of Michigan, Ann Arbor, MI, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4188-4650","authenticated-orcid":false,"given":"Ronald","family":"Dreslinski","sequence":"additional","affiliation":[{"name":"University of Michigan, Ann Arbor, MI, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2457-4119","authenticated-orcid":false,"given":"Nishil","family":"Talati","sequence":"additional","affiliation":[{"name":"University of Michigan, Ann Arbor, MI, USA"}]}],"member":"320","published-online":{"date-parts":[[2025,6,20]]},"reference":[{"key":"e_1_3_3_1_2_2","unstructured":"2009. Homo sapiens genome. https:\/\/www.ncbi.nlm.nih.gov\/datasets\/genome\/GCF_000001405.13\/."},{"key":"e_1_3_3_1_3_2","unstructured":"2020. 980 PRO. https:\/\/semiconductor.samsung.com\/consumer-storage\/internal-ssd\/980pro\/."},{"key":"e_1_3_3_1_4_2","doi-asserted-by":"publisher","DOI":"10.1109\/DAC18072.2020.9218653"},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"publisher","DOI":"10.1145\/3458817.3476212"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"crossref","unstructured":"Jonathan Butler Iain MacCallum Michael Kleber Ilya\u00a0A Shlyakhter Matthew\u00a0K Belmonte Eric\u00a0S Lander Chad Nusbaum and David\u00a0B Jaffe. 2008. ALLPATHS: de novo assembly of whole-genome shotgun microreads. Genome research 18 5 (2008) 810\u2013820.","DOI":"10.1101\/gr.7337908"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527436"},{"key":"e_1_3_3_1_8_2","doi-asserted-by":"publisher","unstructured":"Trevor\u00a0E. Carlson Wim Heirman Stijn Eyerman Ibrahim Hur and Lieven Eeckhout. 2014. An Evaluation of High-Level Mechanistic Core Models. ACM Transactions on Architecture and Code Optimization (TACO) Article 5 (2014) 23\u00a0pages. 10.1145\/2629677","DOI":"10.1145\/2629677"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"crossref","unstructured":"Haoyu Cheng Gregory\u00a0T Concepcion Xiaowen Feng Haowen Zhang and Heng Li. 2021. Haplotype-resolved de novo assembly using phased assembly graphs with hifiasm. Nature methods 18 2 (2021) 170\u2013175.","DOI":"10.1038\/s41592-020-01056-5"},{"key":"e_1_3_3_1_10_2","doi-asserted-by":"publisher","DOI":"10.1109\/HOTCHIPS.2019.8875680"},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"crossref","unstructured":"Juechu Dong Xueshen Liu Harisankar Sadasivan Sriranjani Sitaraman and Satish Narayanasamy. 2024. mm2-gb: GPU Accelerated Minimap2 for Long Read DNA Mapping. bioRxiv (2024) 2024\u201303.","DOI":"10.1101\/2024.03.23.586366"},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"crossref","unstructured":"Mohamed\u00a0S Donia Peter Cimermancic Christopher\u00a0J Schulze Laura C\u00a0Wieland Brown John Martin Makedonka Mitreva Jon Clardy Roger\u00a0G Linington and Michael\u00a0A Fischbach. 2014. A systematic analysis of biosynthetic gene clusters in the human microbiome reveals a common family of antibiotics. Cell 158 6 (2014) 1402\u20131414.","DOI":"10.1016\/j.cell.2014.08.032"},{"key":"e_1_3_3_1_13_2","doi-asserted-by":"crossref","unstructured":"Bar\u0131\u015f Ekim Bonnie Berger and Rayan Chikhi. 2021. Minimizer-space de Bruijn graphs: Whole-genome assembly of long reads in minutes on a personal computer. Cell systems 12 10 (2021) 958\u2013968.","DOI":"10.1016\/j.cels.2021.08.009"},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527432"},{"key":"e_1_3_3_1_15_2","doi-asserted-by":"crossref","unstructured":"Daichi Fujiki Xiaowei Wang Arun Subramaniyan and Reetuparna Das. 2021. In-\/near-memory Computing. Synthesis Lectures on Computer Architecture 16 2 (2021) 1\u2013140.","DOI":"10.1007\/978-3-031-01772-8_1"},{"key":"e_1_3_3_1_16_2","doi-asserted-by":"publisher","DOI":"10.1145\/2807591.2807664"},{"key":"e_1_3_3_1_17_2","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2018.00013"},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA59077.2024.00054"},{"key":"e_1_3_3_1_19_2","doi-asserted-by":"crossref","unstructured":"Priyanka Ghosh Sriram Krishnamoorthy and Ananth Kalyanaraman. 2020. Pakman: a scalable algorithm for generating genomic contigs on distributed memory machines. IEEE Transactions on Parallel and Distributed Systems 32 5 (2020) 1191\u20131209.","DOI":"10.1109\/TPDS.2020.3043241"},{"key":"e_1_3_3_1_20_2","doi-asserted-by":"crossref","unstructured":"Juan G\u00f3mez-Luna Izzat El\u00a0Hajj Ivan Fernandez Christina Giannoula Geraldo\u00a0F Oliveira and Onur Mutlu. 2022. Benchmarking a new paradigm: Experimental analysis and characterization of a real processing-in-memory system. IEEE Access 10 (2022) 52565\u201352608.","DOI":"10.1109\/ACCESS.2022.3174101"},{"key":"e_1_3_3_1_21_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2018.00091"},{"key":"e_1_3_3_1_22_2","doi-asserted-by":"publisher","DOI":"10.1145\/3579371.3589060"},{"key":"e_1_3_3_1_23_2","doi-asserted-by":"publisher","DOI":"10.1109\/FCCM.2019.00027"},{"key":"e_1_3_3_1_24_2","doi-asserted-by":"crossref","unstructured":"Alexey Gurevich Vladislav Saveliev Nikolay Vyahhi and Glenn Tesler. 2013. QUAST: quality assessment tool for genome assemblies. Bioinformatics 29 8 (2013) 1072\u20131075.","DOI":"10.1093\/bioinformatics\/btt086"},{"key":"e_1_3_3_1_25_2","doi-asserted-by":"crossref","unstructured":"Weichun Huang Leping Li Jason\u00a0R Myers and Gabor\u00a0T Marth. 2012. ART: a next-generation sequencing read simulator. Bioinformatics 28 4 (2012) 593\u2013594.","DOI":"10.1093\/bioinformatics\/btr708"},{"key":"e_1_3_3_1_26_2","doi-asserted-by":"publisher","DOI":"10.1109\/HiPC.2013.6799107"},{"key":"e_1_3_3_1_27_2","doi-asserted-by":"crossref","unstructured":"Saurabh Kalikar Chirag Jain Md Vasimuddin and Sanchit Misra. 2022. Accelerating minimap2 for long-read sequencing applications on modern CPUs. Nature Computational Science 2 2 (2022) 78\u201383.","DOI":"10.1038\/s43588-022-00201-8"},{"key":"e_1_3_3_1_28_2","first-page":"790","volume-title":"ISCA","author":"Ke Liu","year":"2020","unstructured":"Liu Ke, Udit Gupta, Benjamin\u00a0Youngjae Cho, David Brooks, Vikas Chandra, Utku Diril, Amin Firoozshahian, Kim Hazelwood, Bill Jia, Hsien-Hsin\u00a0S Lee, Meng Li, Bert Maher, Dheevatsa Mudigere, Maxim Naumov, Martin Schatz, Mikhail Smelyanskiy, Xiaodong Wang, Brandon Reagen, Carole-Jean Wu, Mark Hempstead, and Xuan Zhang. 2020. Recnmp: Accelerating personalized recommendation with near-memory processing. In ISCA. 790\u2013803."},{"key":"e_1_3_3_1_29_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISLPED58423.2023.10244420"},{"key":"e_1_3_3_1_30_2","doi-asserted-by":"publisher","DOI":"10.1109\/HCS52781.2021.9567191"},{"key":"e_1_3_3_1_31_2","doi-asserted-by":"crossref","unstructured":"Yoongu Kim Weikun Yang and Onur Mutlu. 2015. Ramulator: A fast and extensible DRAM simulator. IEEE Computer architecture letters 15 1 (2015) 45\u201349.","DOI":"10.1109\/LCA.2015.2414456"},{"key":"e_1_3_3_1_32_2","doi-asserted-by":"crossref","unstructured":"Sergey Koren Brian\u00a0P Walenz Konstantin Berlin Jason\u00a0R Miller Nicholas\u00a0H Bergman and Adam\u00a0M Phillippy. 2017. Canu: scalable and accurate long-read assembly via adaptive k-mer weighting and repeat separation. Genome research 27 5 (2017) 722\u2013736.","DOI":"10.1101\/gr.215087.116"},{"key":"e_1_3_3_1_33_2","doi-asserted-by":"publisher","DOI":"10.1145\/3352460.3358284"},{"key":"e_1_3_3_1_34_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA52012.2021.00013"},{"key":"e_1_3_3_1_35_2","doi-asserted-by":"crossref","unstructured":"Dinghua Li Chi-Man Liu Ruibang Luo Kunihiko Sadakane and Tak-Wah Lam. 2015. MEGAHIT: an ultra-fast single-node solution for large and complex metagenomics assembly via succinct de Bruijn graph. Bioinformatics 31 10 (2015) 1674\u20131676.","DOI":"10.1093\/bioinformatics\/btv033"},{"key":"e_1_3_3_1_36_2","doi-asserted-by":"publisher","unstructured":"Heng Li. 2018. Minimap2: pairwise alignment for nucleotide sequences. Bioinformatics 34 18 (05 2018) 3094\u20133100. 10.1093\/bioinformatics\/bty191 arXiv:https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/34\/18\/3094\/48919122\/bioinformatics_34_18_3094.pdf","DOI":"10.1093\/bioinformatics\/bty191"},{"key":"e_1_3_3_1_37_2","doi-asserted-by":"publisher","DOI":"10.1145\/2897937.2898064"},{"key":"e_1_3_3_1_38_2","doi-asserted-by":"publisher","DOI":"10.1109\/HPCC.2011.29"},{"key":"e_1_3_3_1_39_2","doi-asserted-by":"crossref","unstructured":"Patrick\u00a0J Meaney Lawrence\u00a0D Curley Glenn\u00a0D Gilda Mark\u00a0R Hodges Daniel\u00a0J Buerkle Robert\u00a0D Siegl and Roger\u00a0K Dong. 2015. The IBM z13 memory subsystem for big data. IBM Journal of Research and Development 59 4\/5 (2015) 4\u20131.","DOI":"10.1147\/JRD.2015.2429031"},{"key":"e_1_3_3_1_40_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA59077.2024.00050"},{"key":"e_1_3_3_1_41_2","doi-asserted-by":"crossref","unstructured":"Yu Peng Henry\u00a0CM Leung Siu-Ming Yiu and Francis\u00a0YL Chin. 2012. IDBA-UD: a de novo assembler for single-cell and metagenomic sequencing data with highly uneven depth. Bioinformatics 28 11 (2012) 1420\u20131428.","DOI":"10.1093\/bioinformatics\/bts174"},{"key":"e_1_3_3_1_42_2","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-12-817497-5.00028-8"},{"key":"e_1_3_3_1_43_2","doi-asserted-by":"crossref","unstructured":"Harisankar Sadasivan Milos Maric Eric Dawson Vishanth Iyer Johnny Israeli and Satish Narayanasamy. 2023. Accelerating Minimap2 for accurate long read alignment on GPUs. Journal of biotechnology and biomedicine 6 1 (2023) 13.","DOI":"10.1101\/2022.03.09.483575"},{"key":"e_1_3_3_1_44_2","doi-asserted-by":"crossref","unstructured":"Itai Sharon and Jillian\u00a0F Banfield. 2013. Genomes from metagenomics. Science 342 6162 (2013) 1057\u20131058.","DOI":"10.1126\/science.1247023"},{"key":"e_1_3_3_1_45_2","doi-asserted-by":"crossref","unstructured":"Jared\u00a0T Simpson Kim Wong Shaun\u00a0D Jackman Jacqueline\u00a0E Schein Steven\u00a0JM Jones and Inan\u00e7 Birol. 2009. ABySS: a parallel assembler for short read sequence data. Genome research 19 6 (2009) 1117\u20131123.","DOI":"10.1101\/gr.089532.108"},{"key":"e_1_3_3_1_46_2","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC42615.2023.10067810"},{"key":"e_1_3_3_1_47_2","doi-asserted-by":"crossref","unstructured":"Aleksandra Swiercz Wojciech Frohmberg Michal Kierzynka Pawel Wojciechowski Piotr Zurkowski Jan Badura Artur Laskowski Marta Kasprzak and Jacek Blazewicz. 2018. GRASShopPER\u2014An algorithm for de novo assembly based on GPU alignments. PloS one 13 8 (2018) e0202355.","DOI":"10.1371\/journal.pone.0202355"},{"key":"e_1_3_3_1_48_2","doi-asserted-by":"crossref","unstructured":"Nishil Talati Saransh Gupta Pravin Mane and Shahar Kvatinsky. 2016. Logic design within memristive memories using memristor-aided loGIC (MAGIC). TNANO 15 4 (2016) 635\u2013650.","DOI":"10.1109\/TNANO.2016.2570248"},{"key":"e_1_3_3_1_49_2","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO56248.2022.00089"},{"key":"e_1_3_3_1_50_2","doi-asserted-by":"publisher","DOI":"10.1145\/3470496.3527437"},{"key":"e_1_3_3_1_51_2","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPS.2019.00041"},{"key":"e_1_3_3_1_52_2","doi-asserted-by":"crossref","unstructured":"Herbert\u00a0W Virgin and John\u00a0A Todd. 2011. Metagenomics and personalized medicine. Cell 147 1 (2011) 44\u201356.","DOI":"10.1016\/j.cell.2011.09.009"},{"key":"e_1_3_3_1_53_2","doi-asserted-by":"crossref","unstructured":"Lingxi Wu Minxuan Zhou Weihong Xu Ashish Venkat Tajana Rosing and Kevin Skadron. 2024. Abakus: Accelerating k-mer Counting with Storage Technology. ACM Transactions on Architecture and Code Optimization 21 1 (2024) 1\u201326.","DOI":"10.1145\/3632952"},{"key":"e_1_3_3_1_54_2","doi-asserted-by":"publisher","DOI":"10.1145\/3688351.3689154"},{"key":"e_1_3_3_1_55_2","doi-asserted-by":"publisher","DOI":"10.1145\/3352460.3358318"},{"key":"e_1_3_3_1_56_2","doi-asserted-by":"crossref","unstructured":"Daniel\u00a0R Zerbino and Ewan Birney. 2008. Velvet: algorithms for de novo short read assembly using de Bruijn graphs. Genome research 18 5 (2008) 821\u2013829.","DOI":"10.1101\/gr.074492.107"},{"key":"e_1_3_3_1_57_2","doi-asserted-by":"publisher","DOI":"10.1145\/3620666.3651331"},{"key":"e_1_3_3_1_58_2","doi-asserted-by":"publisher","DOI":"10.1109\/PACT52795.2021.00022"},{"key":"e_1_3_3_1_59_2","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA56546.2023.10071005"}],"event":{"name":"ISCA '25: Proceedings of the 52nd Annual International Symposium on Computer Architecture","location":"Tokyo Japan","acronym":"SIGARCH '25","sponsor":["SIGARCH ACM Special Interest Group on Computer Architecture"]},"container-title":["Proceedings of the 52nd Annual International Symposium on Computer Architecture"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3695053.3731056","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,21]],"date-time":"2025-06-21T11:05:24Z","timestamp":1750503924000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3695053.3731056"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,20]]},"references-count":58,"alternative-id":["10.1145\/3695053.3731056","10.1145\/3695053"],"URL":"https:\/\/doi.org\/10.1145\/3695053.3731056","relation":{},"subject":[],"published":{"date-parts":[[2025,6,20]]},"assertion":[{"value":"2025-06-20","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}