{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,10,29]],"date-time":"2024-10-29T11:15:02Z","timestamp":1730200502896,"version":"3.28.0"},"reference-count":30,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2015,11]]},"DOI":"10.1109\/bibm.2015.7359781","type":"proceedings-article","created":{"date-parts":[[2015,12,17]],"date-time":"2015-12-17T22:00:00Z","timestamp":1450389600000},"page":"756-763","source":"Crossref","is-referenced-by-count":3,"title":["A highly parallel next-generation DNA sequencing data analysis pipeline in Hadoop"],"prefix":"10.1109","author":[{"given":"Kareem S.","family":"Aggour","sequence":"first","affiliation":[]},{"given":"Vijay S.","family":"Kumar","sequence":"additional","affiliation":[]},{"given":"Dipen P.","family":"Sangurdekar","sequence":"additional","affiliation":[]},{"given":"Lee A.","family":"Newberg","sequence":"additional","affiliation":[]},{"given":"Chinnappa D.","family":"Kodira","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1038\/nature09744"},{"key":"ref10","first-page":"1297","article-title":"The Genome Analysis Toolkit: A MapReduce Framework for Analyzing Next-generation Sequencing Data. Genome Res","volume":"20","author":"mckenna","year":"2010"},{"key":"ref11","first-page":"308","article-title":"dbSNP: the NCBI database of genetic variation. Nucleic Acids Research","volume":"29","author":"sherry","year":"2001"},{"key":"ref12","first-page":"568","author":"koboldt","year":"2012","journal-title":"VarScan 2 somatic mutation and copy number alteration discovery in cancer by exome sequencing Genome Res"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btt305"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btt183"},{"journal-title":"DNA Sequencing Not Quite HPC yet","year":"0","author":"lockwood","key":"ref15"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/s10877-005-3463-y"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1186\/1471-2105-11-S12-S1"},{"key":"ref18","article-title":"Scalable Genome Resequencing with ADAM and Avocado","author":"nothaft","year":"2015","journal-title":"Technical Report No UCB\/EECS"},{"key":"ref19","article-title":"Accelerating Data-Intensive Genome Analysis in the Cloud","author":"mohamed","year":"2013","journal-title":"Proc of the 5th Intl Conf on Bioinformatics and Comp Biology"},{"key":"ref28","article-title":"GenBase: A Complex Analytics Genomics Benchmark","author":"taft","year":"2013","journal-title":"Tech Report No MIT-CSAI L-TR-2013&#x2013;028"},{"journal-title":"Hadoop The Definitive Guide O'reilly Media","year":"2012","author":"white","key":"ref4"},{"key":"ref27","article-title":"Genomic Applications on Cray Supercomputers: Next Generation Sequencing Workflow","author":"kandel","year":"2013","journal-title":"Cray User Group Conference"},{"key":"ref3","first-page":"183","article-title":"Efficient Next-Generation DNA Sequencing in Hadoop","author":"aggour","year":"2014","journal-title":"Proc of the 6th Intl Conf on Bioinformatics and Comp Biology"},{"journal-title":"FastQC Babraham Bioinformatics Institute","year":"0","key":"ref6"},{"key":"ref29","first-page":"56","article-title":"1000 Genomes Project Consortium, An integrated map of genetic variation from 1,092 human genomes","volume":"491","author":"abecasis","year":"2012","journal-title":"Nature"},{"journal-title":"GE Healthcare SeqWright &#x2013; DNA Sequencing Molecular Biology and Custom Genomic Analysis Services","year":"0","key":"ref5"},{"key":"ref8","first-page":"357","article-title":"Fast gapped-read alignment with Bowtie 2, Nat Methods","volume":"9","author":"langmead","year":"2012"},{"key":"ref7","first-page":"589","article-title":"Fast and accurate long-read alignment with Burrows-Wheeler transform, Bioinformatics","volume":"26","author":"li","year":"2010"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pbio.1002195"},{"key":"ref9","first-page":"2078","article-title":"1000 Genome Project Data Processing Subgroup, The Sequence Alignment\/Map format and SAMtools, Bioinformatics","volume":"25","author":"li","year":"2009"},{"journal-title":"The DNA Data Deluge IEEE Spectrum issue on Biomedical devices","year":"2013","author":"schatz","key":"ref1"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/MDAT.2013.2293757"},{"journal-title":"Proc of 11th IEEE Intl Workshop on High Performance Comp Biology","article-title":"Investigating Memory Optimization of Hash-index for Next Generation Sequencing on Multi-core Architecture","year":"2012","key":"ref22"},{"journal-title":"HPC Software Libraries for Next-Gen Sequencing Analytics &#x2013; Aluru Lab","year":"0","key":"ref21"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1093\/bioinformatics\/btv179"},{"key":"ref23","article-title":"Building Highly-Optimized, Low-Latency Pipelines for Genomic Data Analysis","author":"diao","year":"2015","journal-title":"Proc Int'l Conf Innovative Data Systems Research (CIDR)"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC.2014.7040949"},{"key":"ref25","article-title":"Engineering a High-performance SNP detection pipeline","author":"rengasamy","year":"2015","journal-title":"Tech Report"}],"event":{"name":"2015 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)","start":{"date-parts":[[2015,11,9]]},"location":"Washington, DC, USA","end":{"date-parts":[[2015,11,12]]}},"container-title":["2015 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7350074\/7359638\/07359781.pdf?arnumber=7359781","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,3,25]],"date-time":"2017-03-25T02:02:05Z","timestamp":1490407325000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7359781\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,11]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/bibm.2015.7359781","relation":{},"subject":[],"published":{"date-parts":[[2015,11]]}}}