{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,13]],"date-time":"2026-04-13T14:10:02Z","timestamp":1776089402150,"version":"3.50.1"},"reference-count":14,"publisher":"Oxford University Press (OUP)","issue":"14","license":[{"start":{"date-parts":[[2018,3,1]],"date-time":"2018-03-01T00:00:00Z","timestamp":1519862400000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by-nc\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100001691","name":"JSPS","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001691","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001691","name":"KAKENHI","doi-asserted-by":"crossref","award":["JP16K07464"],"award-info":[{"award-number":["JP16K07464"]}],"id":[{"id":"10.13039\/501100001691","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001691","name":"KAKENHI","doi-asserted-by":"crossref","award":["JP17J06457"],"award-info":[{"award-number":["JP17J06457"]}],"id":[{"id":"10.13039\/501100001691","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Platform Project for Supporting Drug Discovery and Life Science Research","award":["JP17am0101110"],"award-info":[{"award-number":["JP17am0101110"]}]},{"name":"Platform Project for Supporting Drug Discovery and Life Science Research","award":["JP17am0101108"],"award-info":[{"award-number":["JP17am0101108"]}]},{"DOI":"10.13039\/100009619","name":"AMED","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100009619","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2018,7,15]]},"abstract":"<jats:title>Abstract<\/jats:title><jats:sec><jats:title>Summary<\/jats:title><jats:p>We report an update for the MAFFT multiple sequence alignment program to enable parallel calculation of large numbers of sequences. The G-INS-1 option of MAFFT was recently reported to have higher accuracy than other methods for large data, but this method has been impractical for most large-scale analyses, due to the requirement of large computational resources. We introduce a scalable variant, G-large-INS-1, which has equivalent accuracy to G-INS-1 and is applicable to 50\u00a0000 or more sequences.<\/jats:p><\/jats:sec><jats:sec><jats:title>Availability and implementation<\/jats:title><jats:p>This feature is available in MAFFT versions 7.355 or later at https:\/\/mafft.cbrc.jp\/alignment\/software\/mpi.html.<\/jats:p><\/jats:sec><jats:sec><jats:title>Supplementary information<\/jats:title><jats:p>Supplementary data are available at Bioinformatics online.<\/jats:p><\/jats:sec>","DOI":"10.1093\/bioinformatics\/bty121","type":"journal-article","created":{"date-parts":[[2018,2,28]],"date-time":"2018-02-28T12:20:25Z","timestamp":1519820425000},"page":"2490-2492","source":"Crossref","is-referenced-by-count":944,"title":["Parallelization of MAFFT for large-scale multiple sequence alignments"],"prefix":"10.1093","volume":"34","author":[{"given":"Tsukasa","family":"Nakamura","sequence":"first","affiliation":[{"name":"Department of Computational Biology and Medical Sciences, Graduate School of Frontier Sciences, University of Tokyo, Chiba, Japan"},{"name":"Artificial Intelligence Research Center (AIRC), National Institute of Advanced Industrial Science and Technology (AIST), Tokyo, Japan"}]},{"given":"Kazunori D","family":"Yamada","sequence":"additional","affiliation":[{"name":"Artificial Intelligence Research Center (AIRC), National Institute of Advanced Industrial Science and Technology (AIST), Tokyo, Japan"},{"name":"Graduate School of Information Sciences, Tohoku University, Sendai, Japan"}]},{"given":"Kentaro","family":"Tomii","sequence":"additional","affiliation":[{"name":"Department of Computational Biology and Medical Sciences, Graduate School of Frontier Sciences, University of Tokyo, Chiba, Japan"},{"name":"Artificial Intelligence Research Center (AIRC), National Institute of Advanced Industrial Science and Technology (AIST), Tokyo, Japan"},{"name":"Biotechnology Research Institute for Drug Discovery (BRD), AIST, Tokyo, Japan"},{"name":"AIST-Tokyo Tech Real World Big-Data Computation Open Innovation Laboratory (RWBC-OIL), Tokyo, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4133-8393","authenticated-orcid":false,"given":"Kazutaka","family":"Katoh","sequence":"additional","affiliation":[{"name":"Artificial Intelligence Research Center (AIRC), National Institute of Advanced Industrial Science and Technology (AIST), Tokyo, Japan"},{"name":"Research Institute for Microbial Diseases, Osaka University, Suita, Japan"}]}],"member":"286","published-online":{"date-parts":[[2018,3,1]]},"reference":[{"key":"2023012713012005500_bty121-B1","doi-asserted-by":"crossref","first-page":"26.","DOI":"10.1186\/s13015-015-0057-1","article-title":"Instability in progressive multiple sequence alignment algorithms","volume":"10","author":"Boyce","year":"2015","journal-title":"Algorithms Mol Biol"},{"key":"2023012713012005500_bty121-B2","doi-asserted-by":"crossref","first-page":"W389","DOI":"10.1093\/nar\/gkv332","article-title":"JPred4: a protein secondary structure prediction server","volume":"43","author":"Drozdetskiy","year":"2015","journal-title":"Nucleic Acids Res"},{"key":"2023012713012005500_bty121-B3","doi-asserted-by":"crossref","first-page":"814","DOI":"10.1093\/bioinformatics\/btv592","article-title":"Using de novo protein structure predictions to measure the quality of very large multiple sequence alignments","volume":"32","author":"Fox","year":"2016","journal-title":"Bioinformatics"},{"key":"2023012713012005500_bty121-B4","doi-asserted-by":"crossref","first-page":"169","DOI":"10.1016\/j.jbiotec.2017.06.1198","article-title":"25 years of serving the community with ribosomal RNA gene reference databases and tools","volume":"261","author":"Gl\u00f6ckner","year":"2017","journal-title":"J. Biotechnol"},{"key":"2023012713012005500_bty121-B5","doi-asserted-by":"crossref","first-page":"3826","DOI":"10.1093\/bioinformatics\/btw558","article-title":"MSAProbs-MPI: parallel multiple sequence aligner for distributed-memory systems","volume":"32","author":"Gonz\u00e1lez-Dom\u00ednguez","year":"2016","journal-title":"Bioinformatics"},{"key":"2023012713012005500_bty121-B6","doi-asserted-by":"crossref","first-page":"41553.","DOI":"10.1038\/srep41553","article-title":"QuickProbs 2: towards rapid construction of high-quality alignments of large protein families","volume":"7","author":"Gudy\u015b","year":"2017","journal-title":"Sci. Rep"},{"key":"2023012713012005500_bty121-B7","article-title":"MAFFT online service: multiple sequence alignment, interactive sequence choice and visualization","author":"Katoh","year":"2017","journal-title":"Brief Bioinformatics"},{"key":"2023012713012005500_bty121-B8","doi-asserted-by":"crossref","first-page":"1331","DOI":"10.1093\/bioinformatics\/btw840","article-title":"Protein multiple sequence alignment benchmarking through secondary structure prediction","volume":"33","author":"Le","year":"2017","journal-title":"Bioinformatics"},{"key":"2023012713012005500_bty121-B9","doi-asserted-by":"crossref","first-page":"443","DOI":"10.1016\/0022-2836(70)90057-4","article-title":"A general method applicable to the search for similarities in the amino acid sequence of two proteins","volume":"48","author":"Needleman","year":"1970","journal-title":"J. Mol. Biol"},{"key":"2023012713012005500_bty121-B10","doi-asserted-by":"crossref","first-page":"407","DOI":"10.1093\/bioinformatics\/14.5.407","article-title":"COFFEE: an objective function for multiple sequence alignments","volume":"14","author":"Notredame","year":"1998","journal-title":"Bioinformatics"},{"key":"2023012713012005500_bty121-B11","doi-asserted-by":"crossref","first-page":"47.","DOI":"10.1186\/1471-2105-4-47","article-title":"OXBench: a benchmark for evaluation of protein multiple sequence alignment accuracy","volume":"4","author":"Raghava","year":"2003","journal-title":"BMC Bioinformatics"},{"key":"2023012713012005500_bty121-B12","doi-asserted-by":"crossref","first-page":"539","DOI":"10.1038\/msb.2011.75","article-title":"Fast, scalable generation of high-quality protein multiple sequence alignments using Clustal Omega","volume":"7","author":"Sievers","year":"2011","journal-title":"Mol. Syst. Biol"},{"key":"2023012713012005500_bty121-B13","doi-asserted-by":"crossref","first-page":"989","DOI":"10.1093\/bioinformatics\/btt093","article-title":"Making automated multiple alignments of very large numbers of protein sequences","volume":"29","author":"Sievers","year":"2013","journal-title":"Bioinformatics"},{"key":"2023012713012005500_bty121-B14","doi-asserted-by":"crossref","first-page":"3246","DOI":"10.1093\/bioinformatics\/btw412","article-title":"Application of the MAFFT sequence alignment program to large data\u2014reexamination of the usefulness of chained guide trees","volume":"32","author":"Yamada","year":"2016","journal-title":"Bioinformatics"}],"container-title":["Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/34\/14\/2490\/48917281\/bioinformatics_34_14_2490.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article-pdf\/34\/14\/2490\/48917281\/bioinformatics_34_14_2490.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,9,1]],"date-time":"2023-09-01T10:26:13Z","timestamp":1693563973000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bioinformatics\/article\/34\/14\/2490\/4916099"}},"subtitle":[],"editor":[{"given":"John","family":"Hancock","sequence":"additional","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2018,3,1]]},"references-count":14,"journal-issue":{"issue":"14","published-print":{"date-parts":[[2018,7,15]]}},"URL":"https:\/\/doi.org\/10.1093\/bioinformatics\/bty121","relation":{},"ISSN":["1367-4803","1367-4811"],"issn-type":[{"value":"1367-4803","type":"print"},{"value":"1367-4811","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2018,7,15]]},"published":{"date-parts":[[2018,3,1]]}}}