{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,6]],"date-time":"2026-04-06T12:26:49Z","timestamp":1775478409911,"version":"3.50.1"},"reference-count":82,"publisher":"Springer Science and Business Media LLC","issue":"11","license":[{"start":{"date-parts":[[2021,11,16]],"date-time":"2021-11-16T00:00:00Z","timestamp":1637020800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2021,11,16]],"date-time":"2021-11-16T00:00:00Z","timestamp":1637020800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Nat Mach Intell"],"DOI":"10.1038\/s42256-021-00413-z","type":"journal-article","created":{"date-parts":[[2021,11,16]],"date-time":"2021-11-16T12:02:38Z","timestamp":1637064158000},"page":"936-944","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":74,"title":["The immuneML ecosystem for machine learning analysis of adaptive immune receptor repertoires"],"prefix":"10.1038","volume":"3","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-2484-3868","authenticated-orcid":false,"given":"Milena","family":"Pavlovi\u0107","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8900-075X","authenticated-orcid":false,"given":"Lonneke","family":"Scheffer","sequence":"additional","affiliation":[]},{"given":"Keshav","family":"Motwani","sequence":"additional","affiliation":[]},{"given":"Chakravarthi","family":"Kanduri","sequence":"additional","affiliation":[]},{"given":"Radmila","family":"Kompova","sequence":"additional","affiliation":[]},{"given":"Nikolay","family":"Vazov","sequence":"additional","affiliation":[]},{"given":"Knut","family":"Waagan","sequence":"additional","affiliation":[]},{"given":"Fabian L. M.","family":"Bernal","sequence":"additional","affiliation":[]},{"given":"Alexandre Almeida","family":"Costa","sequence":"additional","affiliation":[]},{"given":"Brian","family":"Corrie","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6692-0876","authenticated-orcid":false,"given":"Rahmad","family":"Akbar","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1639-1424","authenticated-orcid":false,"given":"Ghadi S.","family":"Al Hajj","sequence":"additional","affiliation":[]},{"given":"Gabriel","family":"Balaban","sequence":"additional","affiliation":[]},{"given":"Todd M.","family":"Brusko","sequence":"additional","affiliation":[]},{"given":"Maria","family":"Chernigovskaya","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9889-1221","authenticated-orcid":false,"given":"Scott","family":"Christley","sequence":"additional","affiliation":[]},{"given":"Lindsay G.","family":"Cowell","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9097-7963","authenticated-orcid":false,"given":"Robert","family":"Frank","sequence":"additional","affiliation":[]},{"given":"Ivar","family":"Grytten","sequence":"additional","affiliation":[]},{"given":"Sveinung","family":"Gundersen","sequence":"additional","affiliation":[]},{"given":"Ingrid Hob\u00e6k","family":"Haff","sequence":"additional","affiliation":[]},{"given":"Eivind","family":"Hovig","sequence":"additional","affiliation":[]},{"given":"Ping-Han","family":"Hsieh","sequence":"additional","affiliation":[]},{"given":"G\u00fcnter","family":"Klambauer","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6280-3130","authenticated-orcid":false,"given":"Marieke L.","family":"Kuijjer","sequence":"additional","affiliation":[]},{"given":"Christin","family":"Lund-Andersen","sequence":"additional","affiliation":[]},{"given":"Antonio","family":"Martini","sequence":"additional","affiliation":[]},{"given":"Thomas","family":"Minotto","sequence":"additional","affiliation":[]},{"given":"Johan","family":"Pensar","sequence":"additional","affiliation":[]},{"given":"Knut","family":"Rand","sequence":"additional","affiliation":[]},{"given":"Enrico","family":"Riccardi","sequence":"additional","affiliation":[]},{"given":"Philippe A.","family":"Robert","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5637-1041","authenticated-orcid":false,"given":"Artur","family":"Rocha","sequence":"additional","affiliation":[]},{"given":"Andrei","family":"Slabodkin","sequence":"additional","affiliation":[]},{"given":"Igor","family":"Snapkov","sequence":"additional","affiliation":[]},{"given":"Ludvig M.","family":"Sollid","sequence":"additional","affiliation":[]},{"given":"Dmytro","family":"Titov","sequence":"additional","affiliation":[]},{"given":"C\u00e9dric R.","family":"Weber","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5721-0135","authenticated-orcid":false,"given":"Michael","family":"Widrich","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9311-9884","authenticated-orcid":false,"given":"Gur","family":"Yaari","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2622-5032","authenticated-orcid":false,"given":"Victor","family":"Greiff","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4959-1409","authenticated-orcid":false,"given":"Geir Kjetil","family":"Sandve","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,11,16]]},"reference":[{"key":"413_CR1","doi-asserted-by":"publisher","first-page":"701","DOI":"10.1039\/C9ME00071B","volume":"4","author":"AJ Brown","year":"2019","unstructured":"Brown, A. J. et al. Augmenting adaptive immunity: progress and challenges in the quantitative engineering and analysis of adaptive immune receptor repertoires. Mol. Syst. Des. Eng. 4, 701\u2013736 (2019).","journal-title":"Mol. Syst. Des. Eng."},{"key":"413_CR2","doi-asserted-by":"publisher","first-page":"158","DOI":"10.1038\/nbt.2782","volume":"32","author":"G Georgiou","year":"2014","unstructured":"Georgiou, G. et al. The promise and challenge of high-throughput sequencing of the antibody repertoire. Nat. Biotechnol. 32, 158\u2013168 (2014).","journal-title":"Nat. Biotechnol."},{"key":"413_CR3","doi-asserted-by":"publisher","DOI":"10.1186\/s13073-015-0243-2","volume":"7","author":"G Yaari","year":"2015","unstructured":"Yaari, G. & Kleinstein, S. H. Practical guidelines for B-cell receptor repertoire sequencing analysis. Genome Med. 7, 121 (2015).","journal-title":"Genome Med."},{"key":"413_CR4","doi-asserted-by":"publisher","first-page":"101519","DOI":"10.1016\/j.isci.2020.101519","volume":"23","author":"L Csepregi","year":"2020","unstructured":"Csepregi, L., Ehling, R. A., Wagner, B. & Reddy, S. T. Immune literacy: reading, writing, and editing adaptive immunity. iScience 23, 101519 (2020).","journal-title":"iScience"},{"key":"413_CR5","doi-asserted-by":"publisher","first-page":"e38358","DOI":"10.7554\/eLife.38358","volume":"7","author":"WS DeWitt III","year":"2018","unstructured":"DeWitt, W. S. III et al. Human T cell receptor occurrence patterns encode immune history, genetic background, and receptor specificity. eLife 7, e38358 (2018).","journal-title":"eLife"},{"key":"413_CR6","doi-asserted-by":"publisher","first-page":"659","DOI":"10.1038\/ng.3822","volume":"49","author":"RO Emerson","year":"2017","unstructured":"Emerson, R. O. et al. Immunosequencing identifies signatures of cytomegalovirus exposure history and HLA-mediated effects on the T cell repertoire. Nat. Genet. 49, 659\u2013665 (2017).","journal-title":"Nat. Genet."},{"key":"413_CR7","doi-asserted-by":"publisher","first-page":"26","DOI":"10.1186\/s12979-020-00195-9","volume":"17","author":"C Krishna","year":"2020","unstructured":"Krishna, C., Chowell, D., G\u00f6nen, M., Elhanati, Y. & Chan, T. A. Genetic and environmental determinants of human TCR repertoire diversity. Immun. Ageing 17, 26 (2020).","journal-title":"Immun. Ageing"},{"key":"413_CR8","doi-asserted-by":"publisher","first-page":"2689","DOI":"10.4049\/jimmunol.1302064","volume":"192","author":"OV Britanova","year":"2014","unstructured":"Britanova, O. V. et al. Age-related decrease in TCR repertoire diversity measured with deep and normalized sequence profiling. J. Immunol. 192, 2689\u20132698 (2014).","journal-title":"J. Immunol."},{"key":"413_CR9","doi-asserted-by":"publisher","first-page":"2168","DOI":"10.1073\/pnas.1716146115","volume":"115","author":"T Schneider-Hohendorf","year":"2018","unstructured":"Schneider-Hohendorf, T. et al. Sex bias in MHC I-associated shaping of the adaptive immune system. Proc. Natl Acad. Sci. USA 115, 2168\u20132173 (2018).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"413_CR10","doi-asserted-by":"publisher","unstructured":"Shemesh, O., Polak, P., Lundin, K. E. A., Sollid, L. M. & Yaari, G. Machine learning analysis of na\u00efve B-cell receptor repertoires stratifies celiac disease patients and controls. Front. Immunol. 12, https:\/\/doi.org\/10.3389\/fimmu.2021.627813 (2021).","DOI":"10.3389\/fimmu.2021.627813"},{"key":"413_CR11","doi-asserted-by":"publisher","unstructured":"Ostmeyer, J., Christley, S., Toby, I. T. & Cowell, L. G. Biophysicochemical motifs in T cell receptor sequences distinguish repertoires from tumor-infiltrating lymphocytes and adjacent healthy tissue. Cancer Res. https:\/\/doi.org\/10.1158\/0008-5472.CAN-18-2292 (2019).","DOI":"10.1158\/0008-5472.CAN-18-2292"},{"key":"413_CR12","doi-asserted-by":"publisher","first-page":"eaaz3738","DOI":"10.1126\/scitranslmed.aaz3738","volume":"12","author":"D Beshnova","year":"2020","unstructured":"Beshnova, D. et al. De novo prediction of cancer-associated T cell receptors for noninvasive cancer detection. Sci. Transl. Med. 12, eaaz3738 (2020).","journal-title":"Sci. Transl. Med."},{"key":"413_CR13","doi-asserted-by":"publisher","first-page":"1070","DOI":"10.1136\/annrheumdis-2019-215442","volume":"78","author":"X Liu","year":"2019","unstructured":"Liu, X. et al. T cell receptor \u03b2 repertoires as novel diagnostic markers for systemic lupus erythematosus and rheumatoid arthritis. Ann. Rheum. Dis. 78, 1070\u20131078 (2019).","journal-title":"Ann. Rheum. Dis."},{"key":"413_CR14","doi-asserted-by":"publisher","first-page":"626793","DOI":"10.3389\/fimmu.2021.626793","volume":"12","author":"RA Arnaout","year":"2021","unstructured":"Arnaout, R. A. et al. The future of blood testing is the immunome. Front. Immunol. 12, 626793 (2021).","journal-title":"Front. Immunol."},{"key":"413_CR15","doi-asserted-by":"publisher","unstructured":"Greiff, V., Yaari, G. & Cowell, L. Mining adaptive immune receptor repertoires for biological and clinical information using machine learning. Curr. Opin. Syst. Biol. https:\/\/doi.org\/10.1016\/j.coisb.2020.10.010 (2020).","DOI":"10.1016\/j.coisb.2020.10.010"},{"key":"413_CR16","doi-asserted-by":"publisher","first-page":"108856","DOI":"10.1016\/j.celrep.2021.108856","volume":"34","author":"R Akbar","year":"2021","unstructured":"Akbar, R. et al. A compact vocabulary of paratope-epitope interactions enables predictability of antibody-antigen binding. Cell Rep. 34, 108856 (2021).","journal-title":"Cell Rep."},{"key":"413_CR17","doi-asserted-by":"publisher","first-page":"89","DOI":"10.1038\/nature22383","volume":"547","author":"P Dash","year":"2017","unstructured":"Dash, P. et al. Quantifiable predictive features define epitope-specific T cell receptor repertoires. Nature 547, 89\u201393 (2017).","journal-title":"Nature"},{"key":"413_CR18","doi-asserted-by":"publisher","first-page":"94","DOI":"10.1038\/nature22976","volume":"547","author":"J Glanville","year":"2017","unstructured":"Glanville, J. et al. Identifying specificity groups in the T cell receptor repertoire. Nature 547, 94\u201398 (2017).","journal-title":"Nature"},{"key":"413_CR19","doi-asserted-by":"publisher","first-page":"1803","DOI":"10.3389\/fimmu.2020.01803","volume":"11","author":"I Springer","year":"2020","unstructured":"Springer, I., Besser, H., Tickotsky-Moskovitz, N., Dvorkin, S. & Louzoun, Y. Prediction of specific TCR-peptide binding from large dictionaries of TCR-peptide pairs. Front. Immunol. 11, 1803 (2020).","journal-title":"Front. Immunol."},{"key":"413_CR20","doi-asserted-by":"publisher","unstructured":"Friedensohn, S. et al. Convergent selection in antibody repertoires is revealed by deep learning. Preprint at bioRxiv https:\/\/doi.org\/10.1101\/2020.02.25.965673 (2020).","DOI":"10.1101\/2020.02.25.965673"},{"key":"413_CR21","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1038\/s41551-021-00699-9","volume":"5","author":"DM Mason","year":"2021","unstructured":"Mason, D. M. et al. Optimization of therapeutic antibodies by predicting antigen specificity from antibody sequence via deep learning. Nat. Biomed. Eng. 5, 600\u2013612 (2021).","journal-title":"Nat. Biomed. Eng."},{"key":"413_CR22","doi-asserted-by":"publisher","unstructured":"Moris, P. et al. Current challenges for unseen-epitope TCR interaction prediction and a new perspective derived from image classification. Brief. Bioinform. https:\/\/doi.org\/10.1093\/bib\/bbaa318 (2020).","DOI":"10.1093\/bib\/bbaa318"},{"key":"413_CR23","doi-asserted-by":"publisher","first-page":"12","DOI":"10.3390\/antib9020012","volume":"9","author":"J Graves","year":"2020","unstructured":"Graves, J. et al. A review of deep learning methods for antibodies. Antibodies 9, 12 (2020).","journal-title":"Antibodies"},{"key":"413_CR24","doi-asserted-by":"publisher","first-page":"151","DOI":"10.1016\/j.tips.2020.12.004","volume":"42","author":"H Narayanan","year":"2021","unstructured":"Narayanan, H. et al. Machine learning for biologics: opportunities for protein engineering, developability, and formulation. Trends Pharmacol. Sci. 42, 151\u2013165 (2021).","journal-title":"Trends Pharmacol. Sci."},{"key":"413_CR25","doi-asserted-by":"publisher","first-page":"e9416","DOI":"10.15252\/msb.20199416","volume":"16","author":"DS Fischer","year":"2020","unstructured":"Fischer, D. S., Wu, Y., Schubert, B. & Theis, F. J. Predicting antigen specificity of single T cells based on TCR CDR3 regions. Mol. Syst. Biol. 16, e9416 (2020).","journal-title":"Mol. Syst. Biol."},{"key":"413_CR26","doi-asserted-by":"publisher","unstructured":"Laustsen, A. H., Greiff, V., Karatt-Vellatt, A., Muyldermans, S. & Jenkins, T. P. Animal immunization, in vitro display technologies, and machine learning for antibody discovery. Trends Biotechnol. https:\/\/doi.org\/10.1016\/j.tibtech.2021.03.003 (2021).","DOI":"10.1016\/j.tibtech.2021.03.003"},{"key":"413_CR27","doi-asserted-by":"publisher","first-page":"e1008814","DOI":"10.1371\/journal.pcbi.1008814","volume":"17","author":"E Jokinen","year":"2021","unstructured":"Jokinen, E., Huuhtanen, J., Mustjoki, S., Heinonen, M. & L\u00e4hdesm\u00e4ki, H. Predicting recognition between T cell receptors and epitopes with TCRGP. PLoS Comput. Biol. 17, e1008814 (2021).","journal-title":"PLoS Comput. Biol."},{"key":"413_CR28","doi-asserted-by":"publisher","first-page":"389","DOI":"10.1038\/s41576-019-0122-6","volume":"20","author":"G Eraslan","year":"2019","unstructured":"Eraslan, G., Avsec, \u017d., Gagneur, J. & Theis, F. J. Deep learning: new computational modelling techniques for genomics. Nat. Rev. Genet. 20, 389\u2013403 (2019).","journal-title":"Nat. Rev. Genet."},{"key":"413_CR29","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1038\/s41591-018-0316-z","volume":"25","author":"A Esteva","year":"2019","unstructured":"Esteva, A. et al. A guide to deep learning in healthcare. Nat. Med. 25, 24\u201329 (2019).","journal-title":"Nat. Med."},{"key":"413_CR30","doi-asserted-by":"publisher","unstructured":"Vamathevan, J. et al. Applications of machine learning in drug discovery and development. Nat. Rev. Drug Discov. https:\/\/doi.org\/10.1038\/s41573-019-0024-5 (2019).","DOI":"10.1038\/s41573-019-0024-5"},{"key":"413_CR31","doi-asserted-by":"publisher","first-page":"829","DOI":"10.1038\/nbt.4233","volume":"36","author":"M Wainberg","year":"2018","unstructured":"Wainberg, M., Merico, D., Delong, A. & Frey, B. J. Deep learning in biomedicine. Nat. Biotechnol. 36, 829\u2013838 (2018).","journal-title":"Nat. Biotechnol."},{"key":"413_CR32","doi-asserted-by":"publisher","first-page":"214","DOI":"10.1016\/j.jtbi.2015.10.016","volume":"389","author":"G Lythe","year":"2016","unstructured":"Lythe, G., Callard, R. E., Hoare, R. L. & Molina-Par\u00eds, C. How many TCR clonotypes does a body maintain? J. Theor. Biol. 389, 214\u2013224 (2016).","journal-title":"J. Theor. Biol."},{"key":"413_CR33","doi-asserted-by":"publisher","first-page":"104","DOI":"10.1016\/j.coisb.2019.10.001","volume":"18","author":"T Mora","year":"2019","unstructured":"Mora, T. & Walczak, A. M. How many different clonotypes do immune repertoires contain? Curr. Opin. Syst. Biol. 18, 104\u2013110 (2019).","journal-title":"Curr. Opin. Syst. Biol."},{"key":"413_CR34","doi-asserted-by":"publisher","first-page":"393","DOI":"10.1038\/s41586-019-0879-y","volume":"566","author":"B Briney","year":"2019","unstructured":"Briney, B., Inderbitzin, A., Joyce, C. & Burton, D. R. Commonality despite exceptional diversity in the baseline human antibody repertoire. Nature 566, 393\u2013397 (2019).","journal-title":"Nature"},{"key":"413_CR35","doi-asserted-by":"publisher","unstructured":"Greiff, V. et al. Learning the high-dimensional immunogenomic features that predict public and private antibody repertoires. J. Immunol. https:\/\/doi.org\/10.4049\/jimmunol.1700594 (2017).","DOI":"10.4049\/jimmunol.1700594"},{"key":"413_CR36","doi-asserted-by":"publisher","first-page":"691","DOI":"10.1016\/j.chom.2013.05.008","volume":"13","author":"P Parameswaran","year":"2013","unstructured":"Parameswaran, P. et al. Convergent antibody signatures in human dengue. Cell Host Microbe 13, 691\u2013700 (2013).","journal-title":"Cell Host Microbe"},{"key":"413_CR37","doi-asserted-by":"publisher","first-page":"3181","DOI":"10.1093\/bioinformatics\/btu523","volume":"30","author":"N Thomas","year":"2014","unstructured":"Thomas, N. et al. Tracking global changes induced in the CD4 T-cell receptor repertoire by immunization with a complex antigen using short stretches of CDR3 protein sequence. Bioinformatics 30, 3181\u20133188 (2014).","journal-title":"Bioinformatics"},{"key":"413_CR38","doi-asserted-by":"publisher","first-page":"268","DOI":"10.1177\/2050640614540154","volume":"2","author":"A Christophersen","year":"2014","unstructured":"Christophersen, A. et al. Tetramer-visualized gluten-specific CD4+ T cells in blood as a potential diagnostic marker for coeliac disease without oral gluten challenge. United Eur. Gastroenterol. J. 2, 268\u2013278 (2014).","journal-title":"United Eur. Gastroenterol. J."},{"key":"413_CR39","first-page":"18832","volume":"33","author":"M Widrich","year":"2020","unstructured":"Widrich, M. et al. Modern Hopfield networks and attention for immune repertoire classification. Adv. Neural Inf. Process. Syst. 33, 18832\u201318845 (2020).","journal-title":"Adv. Neural Inf. Process. Syst."},{"key":"413_CR40","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-021-21879-w","volume":"12","author":"J-W Sidhom","year":"2021","unstructured":"Sidhom, J.-W., Larman, H. B., Pardoll, D. M. & Baras, A. S. DeepTCR is a deep learning framework for revealing sequence concepts within T-cell repertoires. Nat. Commun. 12, 1605 (2021).","journal-title":"Nat. Commun."},{"key":"413_CR41","doi-asserted-by":"publisher","first-page":"315","DOI":"10.1038\/s41592-019-0360-8","volume":"16","author":"KM Chen","year":"2019","unstructured":"Chen, K. M., Cofer, E. M., Zhou, J. & Troyanskaya, O. G. Selene: a PyTorch-based deep learning library for sequence data. Nat. Methods 16, 315\u2013318 (2019).","journal-title":"Nat. Methods"},{"key":"413_CR42","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-020-17155-y","volume":"11","author":"W Kopp","year":"2020","unstructured":"Kopp, W., Monti, R., Tamburrini, A., Ohler, U. & Akalin, A. Deep learning for genomics using Janggu. Nat. Commun. 11, 3488 (2020).","journal-title":"Nat. Commun."},{"key":"413_CR43","doi-asserted-by":"publisher","first-page":"409","DOI":"10.1038\/nbt.3825","volume":"35","author":"J Feng","year":"2017","unstructured":"Feng, J. et al. Firmiana: towards a one-stop proteomic cloud platform for data processing and analysis. Nat. Biotechnol. 35, 409\u2013412 (2017).","journal-title":"Nat. Biotechnol."},{"key":"413_CR44","doi-asserted-by":"publisher","first-page":"509","DOI":"10.1038\/s41592-019-0426-7","volume":"16","author":"S Gessulat","year":"2019","unstructured":"Gessulat, S. et al. Prosit: proteome-wide prediction of peptide tandem mass spectra by deep learning. Nat. Methods 16, 509\u2013518 (2019).","journal-title":"Nat. Methods"},{"key":"413_CR45","doi-asserted-by":"publisher","first-page":"100178","DOI":"10.1016\/j.patter.2020.100178","volume":"2","author":"A Tomic","year":"2021","unstructured":"Tomic, A. et al. SIMON: Open-source knowledge discovery platform. Patterns 2, 100178 (2021).","journal-title":"Patterns"},{"key":"413_CR46","doi-asserted-by":"publisher","first-page":"513","DOI":"10.1039\/C7SC02664A","volume":"9","author":"Z Wu","year":"2018","unstructured":"Wu, Z. et al. MoleculeNet: a benchmark for molecular machine learning. Chem. Sci. 9, 513\u2013530 (2018).","journal-title":"Chem. Sci."},{"key":"413_CR47","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa, F. et al. Scikit-learn: machine learning in Python. J. Mach. Learn. Res. 12, 2825\u20132830 (2011).","journal-title":"J. Mach. Learn. Res."},{"key":"413_CR48","unstructured":"Paszke, A. et al. in Advances in Neural Information Processing Systems 32 (eds Wallach, H. et al.) 8026\u20138037 (Curran Associates, Inc., 2019)."},{"key":"413_CR49","doi-asserted-by":"publisher","first-page":"W537","DOI":"10.1093\/nar\/gky379","volume":"46","author":"E Afgan","year":"2018","unstructured":"Afgan, E. et al. The Galaxy platform for accessible, reproducible and collaborative biomedical analyses: 2018 update. Nucleic Acids Res. 46, W537\u2013W544 (2018).","journal-title":"Nucleic Acids Res."},{"key":"413_CR50","doi-asserted-by":"publisher","first-page":"1274","DOI":"10.1038\/ni.3873","volume":"18","author":"F Rubelt","year":"2017","unstructured":"Rubelt, F. et al. Adaptive immune receptor repertoire community recommendations for sharing immune-repertoire sequencing data. Nat. Immunol. 18, 1274\u20131278 (2017).","journal-title":"Nat. Immunol."},{"key":"413_CR51","doi-asserted-by":"publisher","first-page":"2206","DOI":"10.3389\/fimmu.2018.02206","volume":"9","author":"JA Vander Heiden","year":"2018","unstructured":"Vander Heiden, J. A. et al. AIRR community standardized representations for annotated immune repertoires. Front. Immunol. 9, 2206 (2018).","journal-title":"Front. Immunol."},{"key":"413_CR52","doi-asserted-by":"publisher","first-page":"380","DOI":"10.1038\/nmeth.3364","volume":"12","author":"DA Bolotin","year":"2015","unstructured":"Bolotin, D. A. et al. MiXCR: software for comprehensive adaptive immunity profiling. Nat. Methods 12, 380\u2013381 (2015).","journal-title":"Nat. Methods"},{"key":"413_CR53","doi-asserted-by":"publisher","first-page":"3356","DOI":"10.1093\/bioinformatics\/btv359","volume":"31","author":"NT Gupta","year":"2015","unstructured":"Gupta, N. T. et al. Change-O: a toolkit for analyzing large-scale B cell immunoglobulin repertoire sequencing data. Bioinformatics 31, 3356\u20133358 (2015).","journal-title":"Bioinformatics"},{"key":"413_CR54","doi-asserted-by":"publisher","first-page":"1930","DOI":"10.1093\/bioinformatics\/btu138","volume":"30","author":"JA Vander Heiden","year":"2014","unstructured":"Vander Heiden, J. A. et al. pRESTO: a toolkit for processing high-throughput sequencing raw reads of lymphocyte receptor repertoires. Bioinformatics 30, 1930\u20131932 (2014).","journal-title":"Bioinformatics"},{"key":"413_CR55","doi-asserted-by":"publisher","unstructured":"Nazarov, V., immunarch.bot & Rumynskiy, E. immunomind\/immunarch: 0.6.5: basic single-cell support. Zenodo https:\/\/doi.org\/10.5281\/zenodo.3893991 (2020).","DOI":"10.5281\/zenodo.3893991"},{"key":"413_CR56","doi-asserted-by":"publisher","first-page":"22","DOI":"10.3389\/fdata.2020.00022","volume":"3","author":"S Christley","year":"2020","unstructured":"Christley, S. et al. The ADC API: a web API for the programmatic query of the AIRR data commons. Front. Big Data 3, 22 (2020).","journal-title":"Front. Big Data"},{"key":"413_CR57","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1111\/imr.12666","volume":"284","author":"BD Corrie","year":"2018","unstructured":"Corrie, B. D. et al. iReceptor: a platform for querying and analyzing antibody\/B-cell and T-cell receptor repertoire data across federated repositories. Immunol. Rev. 284, 24\u201341 (2018).","journal-title":"Immunol. Rev."},{"key":"413_CR58","doi-asserted-by":"publisher","first-page":"D1057","DOI":"10.1093\/nar\/gkz874","volume":"48","author":"DV Bagaev","year":"2020","unstructured":"Bagaev, D. V. et al. VDJdb in 2019: database extension, new analysis infrastructure and a T-cell receptor motif compendium. Nucleic Acids Res. 48, D1057\u2013D1062 (2020).","journal-title":"Nucleic Acids Res."},{"key":"413_CR59","doi-asserted-by":"publisher","unstructured":"Huang, H., Wang, C., Rubelt, F., Scriba, T. J. & Davis, M. M. Analyzing the Mycobacterium tuberculosis immune response by T-cell receptor clustering with GLIPH2 and genome-wide antigen screening. Nat. Biotechnol. https:\/\/doi.org\/10.1038\/s41587-020-0505-4 (2020).","DOI":"10.1038\/s41587-020-0505-4"},{"key":"413_CR60","doi-asserted-by":"publisher","DOI":"10.1038\/ncomms14049","volume":"8","author":"GXY Zheng","year":"2017","unstructured":"Zheng, G. X. Y. et al. Massively parallel digital transcriptional profiling of single cells. Nat. Commun. 8, 14049 (2017).","journal-title":"Nat. Commun."},{"key":"413_CR61","doi-asserted-by":"publisher","unstructured":"Nolan, S. et al. A large-scale database of T-cell receptor beta (TCR\u03b2) sequences and binding associations from natural and synthetic exposure to SARS-CoV-2. Preprint at Research Square https:\/\/doi.org\/10.21203\/rs.3.rs-51964\/v1 (2020).","DOI":"10.21203\/rs.3.rs-51964\/v1"},{"key":"413_CR62","doi-asserted-by":"publisher","first-page":"3594","DOI":"10.1093\/bioinformatics\/btaa158","volume":"36","author":"CR Weber","year":"2020","unstructured":"Weber, C. R. et al. immuneSIM: tunable multi-feature simulation of B- and T-cell receptor repertoires for immunoinformatics benchmarking. Bioinformatics 36, 3594\u20133596 (2020).","journal-title":"Bioinformatics"},{"key":"413_CR63","doi-asserted-by":"publisher","unstructured":"Marcou, Q., Mora, T. & Walczak, A.M. High-throughput immune repertoire analysis with IGoR. Nat Commun 9, 561 (2018). https:\/\/doi.org\/10.1038\/s41467-018-02832-w","DOI":"10.1038\/s41467-018-02832-w"},{"key":"413_CR64","doi-asserted-by":"publisher","first-page":"2974","DOI":"10.1093\/bioinformatics\/btz035","volume":"35","author":"Z Sethna","year":"2019","unstructured":"Sethna, Z., Elhanati, Y., Callan, C. G., Walczak, A. M. & Mora, T. OLGA: fast computation of generation probabilities of B- and T-cell receptor amino acid sequences and motifs. Bioinformatics 35, 2974\u20132981 (2019).","journal-title":"Bioinformatics"},{"key":"413_CR65","doi-asserted-by":"crossref","unstructured":"FAIR principles for data stewardship. Nat. Genet. 48, 343\u2013343 (2016).","DOI":"10.1038\/ng.3544"},{"key":"413_CR66","doi-asserted-by":"publisher","first-page":"71","DOI":"10.1016\/j.coisb.2020.10.001","volume":"24","author":"JK Scott","year":"2020","unstructured":"Scott, J. K. & Breden, F. The adaptive immune receptor repertoire community as a model for FAIR stewardship of big immunology data. Curr. Opin. Syst. Biol. 24, 71\u201377 (2020).","journal-title":"Curr. Opin. Syst. Biol."},{"key":"413_CR67","doi-asserted-by":"publisher","first-page":"1418","DOI":"10.3389\/fimmu.2017.01418","volume":"8","author":"F Breden","year":"2017","unstructured":"Breden, F. et al. Reproducibility and reuse of adaptive immune receptor repertoire data. Front. Immunol. 8, 1418 (2017).","journal-title":"Front. Immunol."},{"key":"413_CR68","doi-asserted-by":"crossref","unstructured":"Software with impact. Nat. Methods 11, 211 (2014).","DOI":"10.1038\/nmeth.2880"},{"key":"413_CR69","doi-asserted-by":"publisher","first-page":"341ps12","DOI":"10.1126\/scitranslmed.aaf5027","volume":"8","author":"SN Goodman","year":"2016","unstructured":"Goodman, S. N., Fanelli, D. & Ioannidis, J. P. A. What does research reproducibility mean? Sci. Transl. Med. 8, 341ps12 (2016).","journal-title":"Sci. Transl. Med."},{"key":"413_CR70","doi-asserted-by":"publisher","unstructured":"Mayer-Blackwell, K. et al. TCR meta-clonotypes for biomarker discovery with tcrdist3: quantification of public, HLA-restricted TCR biomarkers of SARS-CoV-2 infection. Preprint at bioRxiv https:\/\/doi.org\/10.1101\/2020.12.24.424260 (2020).","DOI":"10.1101\/2020.12.24.424260"},{"key":"413_CR71","unstructured":"Abadi, M. et al. TensorFlow: a system for large-scale machine learning. In Proc. 12th USENIX Conference on Operating Systems Design and Implementation 265\u2013283 (USENIX Association, 2016)."},{"key":"413_CR72","doi-asserted-by":"publisher","first-page":"2166","DOI":"10.1016\/j.csbj.2020.06.041","volume":"18","author":"M Vujovic","year":"2020","unstructured":"Vujovic, M. et al. T cell receptor sequence clustering and antigen specificity. Comput. Struct. Biotechnol. J. 18, 2166\u20132173 (2020).","journal-title":"Comput. Struct. Biotechnol. J."},{"key":"413_CR73","doi-asserted-by":"publisher","first-page":"e46935","DOI":"10.7554\/eLife.46935","volume":"8","author":"K Davidsen","year":"2019","unstructured":"Davidsen, K. et al. Deep generative models for T cell receptor protein sequences. eLife 8, e46935 (2019).","journal-title":"eLife"},{"key":"413_CR74","doi-asserted-by":"publisher","first-page":"7345","DOI":"10.1073\/pnas.1510507113","volume":"113","author":"E Bareinboim","year":"2016","unstructured":"Bareinboim, E. & Pearl, J. Causal inference and the data-fusion problem. Proc. Natl Acad. Sci. USA 113, 7345\u20137352 (2016).","journal-title":"Proc. Natl Acad. Sci. USA"},{"key":"413_CR75","doi-asserted-by":"publisher","unstructured":"Pavlovic, M. et al. immuneML: v2.0.2. Zenodo https:\/\/doi.org\/10.5281\/zenodo.5118741 (2021)","DOI":"10.5281\/zenodo.5118741"},{"key":"413_CR76","unstructured":"Fowler, M. Domain-Specific Languages (Addison-Wesley Professional, 2010)."},{"key":"413_CR77","unstructured":"Zenger, M. Programming Language Abstractions for Extensible Software Components Ch. 1.3 (Swiss Federal Institute of Technology, 2004)."},{"key":"413_CR78","doi-asserted-by":"publisher","unstructured":"Pavlovi\u0107, M. immuneML use case 1: replication of a published study inside immuneML. NIRD Research Data Archive https:\/\/doi.org\/10.11582\/2021.00008 (2021).","DOI":"10.11582\/2021.00008"},{"key":"413_CR79","doi-asserted-by":"publisher","unstructured":"Ploenzke, M. S. & Irizarry, R. A. Interpretable convolution methods for learning genomic sequence motifs. Preprint at bioRxiv https:\/\/doi.org\/10.1101\/411934 (2018).","DOI":"10.1101\/411934"},{"key":"413_CR80","doi-asserted-by":"publisher","first-page":"112","DOI":"10.1016\/j.molimm.2020.09.003","volume":"127","author":"N Heikkil\u00e4","year":"2020","unstructured":"Heikkil\u00e4, N. et al. Human thymic T cell repertoire is imprinted with strong convergence to shared sequences. Mol. Immunol. 127, 112\u2013123 (2020).","journal-title":"Mol. Immunol."},{"key":"413_CR81","doi-asserted-by":"publisher","unstructured":"Pavlovi\u0107, M. immuneML use case 2: extending immuneML with a deep learning component for predicting antigen specificity of paired receptor data. NIRD Research Data Archive https:\/\/doi.org\/10.11582\/2021.00009 (2021).","DOI":"10.11582\/2021.00009"},{"key":"413_CR82","doi-asserted-by":"publisher","unstructured":"Scheffer, L. immuneML use case 3: benchmarking ML methods for AIRR classification on ground-truth synthetic data. NIRD Research Data Archive https:\/\/doi.org\/10.11582\/2021.00005 (2021).","DOI":"10.11582\/2021.00005"}],"container-title":["Nature Machine Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/www.nature.com\/articles\/s42256-021-00413-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-021-00413-z","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/www.nature.com\/articles\/s42256-021-00413-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,2,8]],"date-time":"2023-02-08T14:04:59Z","timestamp":1675865099000},"score":1,"resource":{"primary":{"URL":"https:\/\/www.nature.com\/articles\/s42256-021-00413-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,11,16]]},"references-count":82,"journal-issue":{"issue":"11","published-online":{"date-parts":[[2021,11]]}},"alternative-id":["413"],"URL":"https:\/\/doi.org\/10.1038\/s42256-021-00413-z","relation":{"has-preprint":[{"id-type":"doi","id":"10.1101\/2021.03.08.433891","asserted-by":"object"}]},"ISSN":["2522-5839"],"issn-type":[{"value":"2522-5839","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,11,16]]},"assertion":[{"value":"7 April 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 October 2021","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 November 2021","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"V.G. declares advisory board positions in aiNET GmbH and Enpicom B.V., and is a consultant for Roche\/Genentech.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}]}}