{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,29]],"date-time":"2026-03-29T01:32:20Z","timestamp":1774747940055,"version":"3.50.1"},"reference-count":127,"publisher":"Public Library of Science (PLoS)","issue":"3","license":[{"start":{"date-parts":[[2022,3,24]],"date-time":"2022-03-24T00:00:00Z","timestamp":1648080000000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"DOI":"10.13039\/501100008982","name":"National Science Foundation","doi-asserted-by":"publisher","award":["DBI 1553206"],"award-info":[{"award-number":["DBI 1553206"]}],"id":[{"id":"10.13039\/501100008982","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R01GM135631"],"award-info":[{"award-number":["R01GM135631"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R01 HG010067"],"award-info":[{"award-number":["R01 HG010067"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000936","name":"Gordon and Betty Moore Foundation","doi-asserted-by":"publisher","award":["GBMF 4552"],"award-info":[{"award-number":["GBMF 4552"]}],"id":[{"id":"10.13039\/100000936","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Wisconsin Alumni Foundation","award":["AAD5912"],"award-info":[{"award-number":["AAD5912"]}]},{"name":"Donald Hill Family Fellowship"},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R01DE027809"],"award-info":[{"award-number":["R01DE027809"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000936","name":"Gordon and Betty Moore Foundation","doi-asserted-by":"publisher","award":["GBMF 4552"],"award-info":[{"award-number":["GBMF 4552"]}],"id":[{"id":"10.13039\/100000936","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100005825","name":"USDA National Institute of Food and Agriculture","doi-asserted-by":"crossref","award":["2020-67012-31772"],"award-info":[{"award-number":["2020-67012-31772"]}],"id":[{"id":"10.13039\/100005825","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/100009164","name":"Moffitt Cancer Center","doi-asserted-by":"publisher","award":["P30-CA076292"],"award-info":[{"award-number":["P30-CA076292"]}],"id":[{"id":"10.13039\/100009164","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["T32 HG003284"],"award-info":[{"award-number":["T32 HG003284"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100008982","name":"National Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100008982","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Blavatnik Center for Computational Biomedicine"},{"DOI":"10.13039\/100000057","name":"National Institute of General Medical Sciences","doi-asserted-by":"crossref","award":["R35GM142879"],"award-info":[{"award-number":["R35GM142879"]}],"id":[{"id":"10.13039\/100000057","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/100005979","name":"Lustgarten Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100005979","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100012298","name":"Allegheny Health Network","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100012298","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Emerson Foundation","award":["640183"],"award-info":[{"award-number":["640183"]}]},{"name":"National Cancer Institute","award":["U01CA212007, U01CA253403, P30CA006973"],"award-info":[{"award-number":["U01CA212007, U01CA253403, P30CA006973"]}]},{"name":"National Institute of Dental and CraniofacialResearch","award":["R01DE027809"],"award-info":[{"award-number":["R01DE027809"]}]},{"DOI":"10.13039\/100000060","name":"National Institute of Allergy and Infectious Diseases","doi-asserted-by":"publisher","award":["R21AI153997"],"award-info":[{"award-number":["R21AI153997"]}],"id":[{"id":"10.13039\/100000060","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Michelle Lunn Hope Foundation"},{"name":"Folz Fund for Cancer Research"},{"name":"Grand Rapids Community Foundation"},{"DOI":"10.13039\/100000002","name":"National Institutes of Health","doi-asserted-by":"publisher","award":["R21 CA220398"],"award-info":[{"award-number":["R21 CA220398"]}],"id":[{"id":"10.13039\/100000002","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["www.ploscompbiol.org"],"crossmark-restriction":false},"short-container-title":["PLoS Comput Biol"],"DOI":"10.1371\/journal.pcbi.1009803","type":"journal-article","created":{"date-parts":[[2022,3,24]],"date-time":"2022-03-24T21:22:09Z","timestamp":1648156929000},"page":"e1009803","update-policy":"https:\/\/doi.org\/10.1371\/journal.pcbi.corrections_policy","source":"Crossref","is-referenced-by-count":39,"title":["Ten quick tips for deep learning in biology"],"prefix":"10.1371","volume":"18","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7133-8397","authenticated-orcid":true,"given":"Benjamin D.","family":"Lee","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5324-9833","authenticated-orcid":true,"given":"Anthony","family":"Gitter","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8713-9213","authenticated-orcid":true,"given":"Casey S.","family":"Greene","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6989-4493","authenticated-orcid":true,"given":"Sebastian","family":"Raschka","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1203-9514","authenticated-orcid":true,"given":"Finlay","family":"Maguire","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0145-9564","authenticated-orcid":true,"given":"Alexander J.","family":"Titus","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1258-5221","authenticated-orcid":true,"given":"Michael D.","family":"Kessler","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0208-3730","authenticated-orcid":true,"given":"Alexandra J.","family":"Lee","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7209-0717","authenticated-orcid":true,"given":"Marc G.","family":"Chevrette","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0882-308X","authenticated-orcid":true,"given":"Paul Allen","family":"Stewart","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6218-4429","authenticated-orcid":true,"given":"Thiago","family":"Britto-Borges","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3877-0433","authenticated-orcid":true,"given":"Evan M.","family":"Cofer","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9892-8218","authenticated-orcid":true,"given":"Kun-Hsing","family":"Yu","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3029-4658","authenticated-orcid":true,"given":"Juan Jose","family":"Carmona","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3204-342X","authenticated-orcid":true,"given":"Elana J.","family":"Fertig","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4563-3226","authenticated-orcid":true,"given":"Alexandr A.","family":"Kalinin","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6839-2392","authenticated-orcid":true,"given":"Brandon","family":"Signal","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8690-9554","authenticated-orcid":true,"given":"Benjamin J.","family":"Lengerich","sequence":"additional","affiliation":[]},{"given":"Timothy J.","family":"Triche","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1400-3398","authenticated-orcid":true,"given":"Simina M.","family":"Boca","sequence":"additional","affiliation":[]}],"member":"340","published-online":{"date-parts":[[2022,3,24]]},"reference":[{"key":"pcbi.1009803.ref001","doi-asserted-by":"crossref","first-page":"335","DOI":"10.1038\/s41583-020-0277-3","article-title":"Backpropagation and the brain","volume":"21","author":"TP Lillicrap","year":"2020","journal-title":"Nat Rev Neurosci"},{"key":"pcbi.1009803.ref002","doi-asserted-by":"crossref","first-page":"20170387","DOI":"10.1098\/rsif.2017.0387","article-title":"Opportunities and obstacles for deep learning in biology and medicine","volume":"15","author":"T Ching","year":"2018","journal-title":"J R Soc Interface"},{"key":"pcbi.1009803.ref003","doi-asserted-by":"crossref","first-page":"5","DOI":"10.1038\/s41467-017-02388-1","article-title":"VAMPnets for deep learning of molecular kinetics","volume":"9","author":"A Mardt","year":"2018","journal-title":"Nat Commun"},{"key":"pcbi.1009803.ref004","doi-asserted-by":"crossref","first-page":"3135","DOI":"10.1038\/s41467-018-05378-z","article-title":"Deep learning to predict the lab-of-origin of engineered DNA","volume":"9","author":"AAK Nielsen","year":"2018","journal-title":"Nat Commun"},{"key":"pcbi.1009803.ref005","doi-asserted-by":"crossref","first-page":"60","DOI":"10.1038\/s41591-018-0279-0","article-title":"Identifying facial phenotypes of genetic disorders using deep learning","volume":"25","author":"Y Gurovich","year":"2019","journal-title":"Nat Med"},{"key":"pcbi.1009803.ref006","article-title":"Benjamin-Lee\/deep-rules GitHub repository.","author":"B. Lee","year":"2018","journal-title":"GitHub"},{"key":"pcbi.1009803.ref007","doi-asserted-by":"crossref","first-page":"e1007128","DOI":"10.1371\/journal.pcbi.1007128","article-title":"Open collaborative writing with Manubot","volume":"15","author":"DS Himmelstein","year":"2019","journal-title":"PLoS Comput Biol"},{"key":"pcbi.1009803.ref008","volume-title":"Python machine learning: machine learning and deep learning with Python, scikit-learn, and TensorFlow 2.","author":"S Raschka","year":"2019","edition":"3"},{"key":"pcbi.1009803.ref009","doi-asserted-by":"crossref","first-page":"35","DOI":"10.1186\/s13040-017-0155-3","article-title":"Ten quick tips for machine learning in computational biology","volume":"10","author":"D. Chicco","year":"2017","journal-title":"BioData Min"},{"key":"pcbi.1009803.ref010","doi-asserted-by":"crossref","unstructured":"Rudin C, Carlson D. The Secrets of Machine Learning: Ten Things You Wish You Had Known Earlier to be More Effective at Data Analysis. arXiv. 2019 Jun. Report No.: 1906.01998. Available from: https:\/\/arxiv.org\/abs\/1906.01998","DOI":"10.1287\/educ.2019.0200"},{"key":"pcbi.1009803.ref011","article-title":"A guide to machine learning for biologists","author":"JG Greener","year":"2021","journal-title":"Nat Rev Mol Cell Biol"},{"key":"pcbi.1009803.ref012","doi-asserted-by":"crossref","first-page":"630","DOI":"10.1089\/omi.2018.0097","article-title":"Rise of Deep Learning for Genomic, Proteomic, and Metabolomic Data Integration in Precision Medicine","volume":"22","author":"D Grapov","year":"2018","journal-title":"OMICS"},{"key":"pcbi.1009803.ref013","volume-title":"Advances in Intelligent Systems and Computing","author":"A Mathew","year":"2021"},{"key":"pcbi.1009803.ref014","doi-asserted-by":"crossref","first-page":"193","DOI":"10.3390\/info11040193","article-title":"Machine Learning in Python: Main Developments and Technology Trends in Data Science, Machine Learning, and Artificial Intelligence","volume":"11","author":"S Raschka","year":"2020","journal-title":"Information"},{"key":"pcbi.1009803.ref015","doi-asserted-by":"crossref","first-page":"303","DOI":"10.1007\/BF02551274","article-title":"Approximation by superpositions of a sigmoidal function","volume":"2","author":"G. Cybenko","year":"1989","journal-title":"Math Control Signals Syst"},{"key":"pcbi.1009803.ref016","doi-asserted-by":"crossref","first-page":"251","DOI":"10.1016\/0893-6080(91)90009-T","article-title":"Approximation capabilities of multilayer feedforward networks","volume":"4","author":"K. Hornik","year":"1991","journal-title":"Neural Netw"},{"key":"pcbi.1009803.ref017","doi-asserted-by":"crossref","first-page":"125","DOI":"10.3390\/info11020125","article-title":"Albumentations: Fast and Flexible Image Augmentations","volume":"11","author":"A Buslaev","year":"2020","journal-title":"Information"},{"key":"pcbi.1009803.ref018","unstructured":"Ratner A, De Sa C, Wu S, Selsam D, R\u00e9 C. Data Programming: Creating Large Training Sets, Quickly. arXiv. 2016 May. Report No.: 1605.07723v3. Available from: https:\/\/arxiv.org\/abs\/1605.07723v3"},{"key":"pcbi.1009803.ref019","article-title":"Deep Learning for Microalgae Classification","author":"I Correa","year":"2017","journal-title":"Institute of Electrical and Electronics Engineers (IEEE)"},{"key":"pcbi.1009803.ref020","article-title":"WeText: Scene Text Detection under Weak Supervision","author":"S Tian","year":"2017","journal-title":"Institute of Electrical and Electronics Engineers (IEEE)."},{"key":"pcbi.1009803.ref021","doi-asserted-by":"crossref","first-page":"1510","DOI":"10.1038\/s41386-021-01020-7","article-title":"Systematic misestimation of machine learning performance in neuroimaging studies of depression","volume":"46","author":"C Flint","year":"2021","journal-title":"Neuropsychopharmacology"},{"key":"pcbi.1009803.ref022","article-title":"Revisiting Unreasonable Effectiveness of Data in Deep Learning Era","author":"C Sun","year":"2017","journal-title":"Institute of Electrical and Electronics Engineers (IEEE)."},{"key":"pcbi.1009803.ref023","doi-asserted-by":"crossref","DOI":"10.18653\/v1\/2020.acl-main.747","article-title":"Unsupervised Cross-lingual Representation Learning at Scale","author":"A Conneau","year":"2020","journal-title":"Association for Computational Linguistics (ACL)."},{"key":"pcbi.1009803.ref024","unstructured":"Cho J, Lee K, Shin E, Choy G, Do S. How much data is needed to train a medical image deep learning system to achieve necessary high accuracy? arXiv. 2016 Jan. Report No.: 1511.06348. Available from: https:\/\/arxiv.org\/abs\/1511.06348"},{"key":"pcbi.1009803.ref025","doi-asserted-by":"crossref","first-page":"2295","DOI":"10.1109\/JPROC.2017.2761740","article-title":"Efficient Processing of Deep Neural Networks: A Tutorial and Survey","volume":"105","author":"V Sze","year":"2017","journal-title":"Proc IEEE"},{"key":"pcbi.1009803.ref026","unstructured":"Brown TB, Mann B, Ryder N, Subbiah M, Kaplan J, Dhariwal P, et al. Language Models are Few-Shot Learners. arXiv. 2020 Jul. Report No.: 2005.14165. Available from: https:\/\/arxiv.org\/abs\/2005.14165"},{"key":"pcbi.1009803.ref027","doi-asserted-by":"crossref","unstructured":"Strubell E, Ganesh A, McCallum A. Energy and Policy Considerations for Deep Learning in NLP. arXiv. 2019 Jun. Report No.: 1906.02243. Available from: https:\/\/arxiv.org\/abs\/1906.02243","DOI":"10.18653\/v1\/P19-1355"},{"key":"pcbi.1009803.ref028","doi-asserted-by":"crossref","unstructured":"Madani A, McCann B, Naik N, Keskar NS, Anand N, Eguchi RR, et al. ProGen: Language Modeling for Protein Generation. arXiv. 2020 Apr. Report No.: 2004.03497. Available from: https:\/\/arxiv.org\/abs\/2004.03497","DOI":"10.1101\/2020.03.07.982272"},{"key":"pcbi.1009803.ref029","doi-asserted-by":"crossref","unstructured":"Elnaggar A, Heinzinger M, Dallago C, Rihawi G, Wang Y, Jones L, et al. ProtTrans: Towards Cracking the Language of Life\u2019s Code Through Self-Supervised Deep Learning and High Performance Computing. arXiv. 2021 May. Report No.: 2007.06225. Available from: https:\/\/arxiv.org\/abs\/2007.06225","DOI":"10.1101\/2020.07.12.199554"},{"key":"pcbi.1009803.ref030","doi-asserted-by":"crossref","first-page":"e2016239118","DOI":"10.1073\/pnas.2016239118","article-title":"Biological structure and function emerge from scaling unsupervised learning to 250 million protein sequences","volume":"118","author":"A Rives","year":"2021","journal-title":"Proc Natl Acad Sci"},{"key":"pcbi.1009803.ref031","unstructured":"Alsouda Y, Pllana S, Kurti A. A Machine Learning Driven IoT Solution for Noise Classification in Smart Cities. arXiv. 2018 Sep. Report No.: 1809.00238. Available from: https:\/\/arxiv.org\/abs\/1809.00238"},{"key":"pcbi.1009803.ref032","unstructured":"Abadi M, Agarwal A, Barham P, Brevdo E, Chen Z, Citro C, et al. Tensor Flow: Large-Scale Machine Learning on Heterogeneous Distributed Systems. arXiv. 2016 Mar. Report No.: 1603.04467. Available from: https:\/\/arxiv.org\/abs\/1603.04467"},{"key":"pcbi.1009803.ref033","unstructured":"Paszke A, Gross S, Massa F, Lerer A, Bradbury J, Chanan G, et al. PyTorch: An Imperative Style, High-Performance Deep Learning Library. arXiv. 2019 Dec. Report No.: 1912.01703. Available from: https:\/\/arxiv.org\/abs\/1912.01703"},{"key":"pcbi.1009803.ref034","first-page":"2825","article-title":"Scikit-learn: Machine Learning in Python","volume":"12","author":"F Pedregosa","year":"2011","journal-title":"J Mach Learn Res"},{"key":"pcbi.1009803.ref035","volume-title":"Lecture Notes in Computer Science","author":"RS Olson","year":"2016"},{"key":"pcbi.1009803.ref036","unstructured":"GitHub\u2014apple\/turicreate: Turi Create simplifies the development of custom machine learning models. In: GitHub [Internet]. [cited 2021 Nov 29]. Available from: https:\/\/github.com\/apple\/turicreate"},{"key":"pcbi.1009803.ref037","doi-asserted-by":"crossref","unstructured":"Jin H, Song Q, Hu X. Auto-Keras: An Efficient Neural Architecture Search System. arXiv. 2019 Mar. Report No.: 1806.10282. Available from: https:\/\/arxiv.org\/abs\/1806.10282","DOI":"10.1145\/3292500.3330648"},{"key":"pcbi.1009803.ref038","unstructured":"Keras: the Python deep learning API. [cited 2021 Nov 29]. Available from: https:\/\/keras.io\/"},{"key":"pcbi.1009803.ref039","doi-asserted-by":"crossref","first-page":"108","DOI":"10.3390\/info11020108","article-title":"Fastai: A Layered API for Deep Learning","volume":"11","author":"J Howard","year":"2020","journal-title":"Information"},{"key":"pcbi.1009803.ref040","doi-asserted-by":"crossref","first-page":"84","DOI":"10.1145\/3065386","article-title":"ImageNet classification with deep convolutional neural networks","volume":"60","author":"A Krizhevsky","year":"2017","journal-title":"Commun ACM"},{"key":"pcbi.1009803.ref041","doi-asserted-by":"crossref","first-page":"290","DOI":"10.3389\/fpsyt.2018.00290","article-title":"A Deep Learning Approach for Predicting Antidepressant Response in Major Depression Using Clinical and Genetic Biomarkers","volume":"9","author":"E Lin","year":"2018","journal-title":"Front Psychiatry"},{"key":"pcbi.1009803.ref042","doi-asserted-by":"crossref","first-page":"257","DOI":"10.1007\/s11604-018-0726-3","article-title":"Deep learning with convolutional neural network in radiology","volume":"36","author":"K Yasaka","year":"2018","journal-title":"Jpn J Radiol"},{"key":"pcbi.1009803.ref043","doi-asserted-by":"crossref","first-page":"1437","DOI":"10.1364\/OPTICA.4.001437","article-title":"Deep learning microscopy","volume":"4","author":"Y Rivenson","year":"2017","journal-title":"Optica"},{"key":"pcbi.1009803.ref044","doi-asserted-by":"crossref","first-page":"813","DOI":"10.1093\/jamia\/ocw180","article-title":"Deep learning for pharmacovigilance: recurrent neural network architectures for labeling adverse drug reactions in Twitter posts","volume":"24","author":"A Cocos","year":"2017","journal-title":"J Am Med Inform Assoc"},{"key":"pcbi.1009803.ref045","doi-asserted-by":"crossref","first-page":"1072","DOI":"10.1111\/2041-210X.13436","article-title":"Deep learning-based methods for individual recognition in small birds","volume":"11","author":"AC Ferreira","year":"2020","journal-title":"Methods Ecol Evol"},{"key":"pcbi.1009803.ref046","article-title":"Deep generative models: Survey","author":"A Oussidi","year":"2018","journal-title":"Institute of Electrical and Electronics Engineers (IEEE)"},{"key":"pcbi.1009803.ref047","doi-asserted-by":"crossref","first-page":"giaa117","DOI":"10.1093\/gigascience\/giaa117","article-title":"Correcting for experiment-specific variability in expression compendia can remove underlying signals","volume":"9","author":"AJ Lee","year":"2020","journal-title":"GigaScience"},{"key":"pcbi.1009803.ref048","unstructured":"Henderson P, Islam R, Bachman P, Pineau J, Precup D, Meger D. Deep Reinforcement Learning that Matters. arXiv. 2019 Jan. Report No.: 1709.06560. Available from: https:\/\/arxiv.org\/abs\/1709.06560"},{"key":"pcbi.1009803.ref049","doi-asserted-by":"crossref","first-page":"10752","DOI":"10.1038\/s41598-019-47148-x","article-title":"Optimization of Molecules via Deep Reinforcement Learning.","volume":"9","author":"Z Zhou","year":"2019","journal-title":"Sci Rep"},{"key":"pcbi.1009803.ref050","article-title":"Easy over hard: a case study on deep learning","author":"W Fu","year":"2017","journal-title":"Association for Computing Machinery (ACM)."},{"key":"pcbi.1009803.ref051","doi-asserted-by":"crossref","first-page":"119","DOI":"10.1186\/s12859-020-3427-8","article-title":"Standard machine learning approaches outperform deep representation learning on phenotype prediction from transcriptomics data","volume":"21","author":"AM Smith","year":"2020","journal-title":"BMC Bioinformatics"},{"key":"pcbi.1009803.ref052","doi-asserted-by":"crossref","first-page":"18","DOI":"10.1038\/s41746-018-0029-1","article-title":"Scalable and accurate deep learning with electronic health records","volume":"1","author":"A Rajkomar","year":"2018","journal-title":"NPJ Digit Med"},{"key":"pcbi.1009803.ref053","doi-asserted-by":"crossref","first-page":"42","DOI":"10.1186\/s13321-017-0226-y","article-title":"Deep-learning: investigating deep neural networks hyper-parameters and comparison of performance to shallow methods for modeling bioactivity data","volume":"9","author":"A Koutsoukas","year":"2017","journal-title":"J Chem"},{"key":"pcbi.1009803.ref054","doi-asserted-by":"crossref","first-page":"43","DOI":"10.1038\/s41746-019-0122-0","article-title":"Deep learning and alternative learning strategies for retrospective real-world clinical data","volume":"2","author":"D Chen","year":"2019","journal-title":"NPJ Digit Med"},{"key":"pcbi.1009803.ref055","unstructured":"Papernot N, McDaniel P. Deep k-Nearest Neighbors: Towards Confident, Interpretable and Robust Deep Learning. arXiv. 2018 Mar. Report No.: 1803.04765. Available from: https:\/\/arxiv.org\/abs\/1803.04765"},{"key":"pcbi.1009803.ref056","unstructured":"Jiang H, Kim B, Guan MY, Gupta M. To Trust Or Not To Trust A Classifier. arXiv. 2018 Oct. Report No.: 1805.11783. Available from: https:\/\/arxiv.org\/abs\/1805.11783"},{"key":"pcbi.1009803.ref057","article-title":"Parameter tuning is a key part of dimensionality reduction via deep variational autoencoders for single cell RNA transcriptomics","author":"Q Hu","year":"2018","journal-title":"Pac Symp Biocomput"},{"key":"pcbi.1009803.ref058","doi-asserted-by":"crossref","first-page":"e1004947","DOI":"10.1371\/journal.pcbi.1004947","article-title":"Ten Simple Rules for Taking Advantage of Git and GitHub","volume":"12","author":"Y Perez-Riverol","year":"2016","journal-title":"PLoS Comput Biol."},{"key":"pcbi.1009803.ref059","doi-asserted-by":"crossref","first-page":"342","DOI":"10.1038\/nbt.3780","article-title":"Reproducibility of computational workflows is automated using continuous analysis","volume":"35","author":"BK Beaulieu-Jones","year":"2017","journal-title":"Nat Biotechnol"},{"key":"pcbi.1009803.ref060","doi-asserted-by":"crossref","first-page":"e1003285","DOI":"10.1371\/journal.pcbi.1003285","article-title":"Ten Simple Rules for Reproducible Computational Research","volume":"9","author":"GK Sandve","year":"2013","journal-title":"PLoS Comput Biol"},{"key":"pcbi.1009803.ref061","unstructured":"Rule A, Birmingham A, Zuniga C, Altintas I, Huang S-C, Knight R, et al. Ten Simple Rules for Reproducible Research in Jupyter Notebooks. arXiv. 2018 Oct. Report No.: 1810.08055. Available from: https:\/\/arxiv.org\/abs\/1810.08055"},{"key":"pcbi.1009803.ref062","doi-asserted-by":"crossref","first-page":"1132","DOI":"10.1038\/s41592-021-01256-7","article-title":"Reproducibility standards for machine learning in the life sciences","volume":"18","author":"BJ Heil","year":"2021","journal-title":"Nat Methods"},{"key":"pcbi.1009803.ref063","unstructured":"NVIDIA. Deep Learning SDK Documentation. 1 Nov 2018. Available from: https:\/\/docs.nvidia.com\/deeplearning\/sdk\/cudnn-developer-guide\/index.html#reproducibility"},{"key":"pcbi.1009803.ref064","article-title":"The Marginal Value of Adaptive Gradient Methods in Machine Learning","volume":"30","author":"AC Wilson","year":"2017","journal-title":"Adv Neural Inf Proces Syst"},{"key":"pcbi.1009803.ref065","article-title":"The Dryad Digital Repository: Published evolutionary data as part of the greater data ecosystem","author":"T. Vision","year":"2010","journal-title":"Nat Prec."},{"key":"pcbi.1009803.ref066","first-page":"138","article-title":"Fig Share","volume":"2","author":"J. Singh","year":"2011","journal-title":"J Pharmacol Pharmacother"},{"key":"pcbi.1009803.ref067","first-page":"e37080","article-title":"Zenodo, an Archive and Publishing Repository: A tale of two herbarium specimen pilot projects.","volume":"3","author":"M Dillen","year":"2019","journal-title":"Biodivers Inf Sci Stand."},{"key":"pcbi.1009803.ref068","first-page":"105","article-title":"Open Science Framework (OSF).","author":"MSLSED Foster","year":"2017","journal-title":"J Med Libr Assoc"},{"key":"pcbi.1009803.ref069","first-page":"56","article-title":"On Reproducible AI: Towards Reproducible Research, Open Science, and Digital Scholarship in AI Publications","volume":"39","author":"OE Gundersen","year":"2018","journal-title":"AI Mag."},{"key":"pcbi.1009803.ref070","doi-asserted-by":"crossref","first-page":"365","DOI":"10.1038\/ng1201-365","article-title":"Minimum information about a microarray experiment (MIAME)\u2014toward standards for microarray data","volume":"29","author":"A Brazma","year":"2001","journal-title":"Nat Genet"},{"key":"pcbi.1009803.ref071","doi-asserted-by":"crossref","first-page":"733","DOI":"10.1038\/nrg2825","article-title":"Tackling the widespread and critical impact of batch effects in high-throughput data","volume":"11","author":"JT Leek","year":"2010","journal-title":"Nat Rev Genet"},{"key":"pcbi.1009803.ref072","volume-title":"Lecture Notes in Computer Science","year":"2012"},{"key":"pcbi.1009803.ref073","unstructured":"Bai S, Kolter JZ, Koltun V. An Empirical Evaluation of Generic Convolutional and Recurrent Networks for Sequence Modeling. arXiv. 2018 Apr. Report No.: 1803.01271. Available from: https:\/\/arxiv.org\/abs\/1803.01271"},{"key":"pcbi.1009803.ref074","unstructured":"Vaswani A, Shazeer N, Parmar N, Uszkoreit J, Jones L, Gomez AN, et al. Attention Is All You Need. arXiv. 2017 Dec. Report No.: 1706.03762. Available from: https:\/\/arxiv.org\/abs\/1706.03762"},{"key":"pcbi.1009803.ref075","doi-asserted-by":"crossref","first-page":"89","DOI":"10.1016\/j.ymeth.2020.06.016","article-title":"Machine learning and AI-based approaches for bioactive ligand discovery and GPCR-ligand recognition","volume":"180","author":"S Raschka","year":"2020","journal-title":"Methods"},{"key":"pcbi.1009803.ref076","doi-asserted-by":"crossref","first-page":"436","DOI":"10.1038\/nature14539","article-title":"Deep learning","volume":"521","author":"Y LeCun","year":"2015","journal-title":"Nature"},{"key":"pcbi.1009803.ref077","unstructured":"Yosinski J, Clune J, Bengio Y, Lipson H. How transferable are features in deep neural networks? Proceedings of the 27th International Conference on Neural Information Processing Systems\u2014Volume 2. Cambridge, MA, USA: MIT Press; 2014. p. 3320\u20133328. Available from: https:\/\/dl.acm.org\/doi\/abs\/10.5555\/2969033.2969197"},{"key":"pcbi.1009803.ref078","doi-asserted-by":"crossref","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","article-title":"ImageNet Large Scale Visual Recognition Challenge","volume":"115","author":"O Russakovsky","year":"2015","journal-title":"Int J Comput Vis"},{"key":"pcbi.1009803.ref079","doi-asserted-by":"crossref","first-page":"95","DOI":"10.1007\/s10278-016-9914-9","article-title":"High-Throughput Classification of Radiographs Using Deep Convolutional Neural Networks","volume":"30","author":"A Rajkomar","year":"2016","journal-title":"J Digit Imaging"},{"key":"pcbi.1009803.ref080","doi-asserted-by":"crossref","first-page":"592","DOI":"10.1038\/s41587-019-0140-0","article-title":"The Kipoi repository accelerates community exchange and reuse of predictive models for genomics","volume":"37","author":"\u017d Avsec","year":"2019","journal-title":"Nat Biotechnol"},{"key":"pcbi.1009803.ref081","article-title":"Transformers: State-of-the-Art Natural Language Processing","author":"T Wolf","year":"2020","journal-title":"Association for Computational Linguistics (ACL)."},{"key":"pcbi.1009803.ref082","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3458754","article-title":"Domain-Specific Language Model Pretraining for Biomedical Natural Language Processing","volume":"3","author":"Y Gu","year":"2022","journal-title":"ACM Transactions on Computing for Healthcare"},{"key":"pcbi.1009803.ref083","unstructured":"Chithrananda S, Grand G, Ramsundar B. Chem BERTa: Large-Scale Self-Supervised Pretraining for Molecular Property Prediction. arXiv. 2020 Oct. Report No.: 2010.09885. Available from: https:\/\/arxiv.org\/abs\/2010.09885"},{"key":"pcbi.1009803.ref084","article-title":"CNN Features Off-the-Shelf: An Astounding Baseline for Recognition","author":"AS Razavian","year":"2014","journal-title":"Institute of Electrical and Electronics Engineers (IEEE)."},{"key":"pcbi.1009803.ref085","doi-asserted-by":"crossref","first-page":"55","DOI":"10.1016\/j.micron.2018.01.010","article-title":"Fast and robust segmentation of white blood cell images by self-supervised learning","volume":"107","author":"X Zheng","year":"2018","journal-title":"Micron"},{"key":"pcbi.1009803.ref086","doi-asserted-by":"crossref","first-page":"322","DOI":"10.1109\/TBDATA.2016.2573280","article-title":"Deep Model Based Transfer and Multi-Task Learning for Biological Image Analysis","volume":"6","author":"W Zhang","year":"2020","journal-title":"IEEE Transactions on Big Data"},{"key":"pcbi.1009803.ref087","doi-asserted-by":"crossref","first-page":"861","DOI":"10.1016\/S0893-6080(05)80131-5","article-title":"Multilayer feedforward networks with a nonpolynomial activation function can approximate any function","volume":"6","author":"M Leshno","year":"1993","journal-title":"Neural Netw"},{"key":"pcbi.1009803.ref088","first-page":"1929","article-title":"Dropout: a simple way to prevent neural networks from overfitting","volume":"15","author":"N Srivastava","year":"2014","journal-title":"J Mach Learn Res"},{"key":"pcbi.1009803.ref089","unstructured":"Ioffe S, Szegedy C. Batch normalization: accelerating deep network training by reducing internal covariate shift. Proceedings of the 32nd International Conference on International Conference on Machine Learning\u2014Volume 37. Lille, France: JMLR.org; 2015. p. 448\u2013456. Available from: https:\/\/dl.acm.org\/citation.cfm?id=3045118.3045167"},{"key":"pcbi.1009803.ref090","doi-asserted-by":"crossref","first-page":"15849","DOI":"10.1073\/pnas.1903070116","article-title":"Reconciling modern machine-learning practice and the classical bias\u2013variance trade-off","volume":"116","author":"M Belkin","year":"2019","journal-title":"Proc Natl Acad Sci"},{"key":"pcbi.1009803.ref091","unstructured":"Raschka S. Model Evaluation, Model Selection, and Algorithm Selection in Machine Learning. arXiv. 2020 Nov. Report No.: 1811.12808. Available from: https:\/\/arxiv.org\/abs\/1811.12808"},{"key":"pcbi.1009803.ref092","doi-asserted-by":"crossref","first-page":"1895","DOI":"10.1162\/089976698300017197","article-title":"Approximate Statistical Tests for Comparing Supervised Classification Learning Algorithms","volume":"10","author":"TG Dietterich","year":"1998","journal-title":"Neural Comput."},{"key":"pcbi.1009803.ref093","first-page":"1929","article-title":"Dropout: A Simple Way to Prevent Neural Networks from Overfitting","volume":"15","author":"N Srivastava","year":"2014","journal-title":"J Mach Learn Res."},{"key":"pcbi.1009803.ref094","unstructured":"Krogh A, Hertz JA. A simple weight decay can improve generalization. Proceedings of the 4th International Conference on Neural Information Processing Systems. San Francisco, CA, USA: Morgan Kaufmann Publishers Inc. 1991. p. 950\u2013957. Available from: http:\/\/dl.acm.org\/citation.cfm?id=2986916.2987033"},{"key":"pcbi.1009803.ref095","doi-asserted-by":"crossref","first-page":"2819","DOI":"10.1021\/acschembio.8b00881","article-title":"Adversarial Controls for Scientific Machine Learning","volume":"13","author":"KV Chuang","year":"2018","journal-title":"ACS Chem Biol"},{"key":"pcbi.1009803.ref096","doi-asserted-by":"crossref","first-page":"e0118432","DOI":"10.1371\/journal.pone.0118432","article-title":"The precision-recall plot is more informative than the ROC plot when evaluating binary classifiers on imbalanced datasets","volume":"10","author":"T Saito","year":"2015","journal-title":"PLoS ONE"},{"key":"pcbi.1009803.ref097","doi-asserted-by":"crossref","first-page":"4462","DOI":"10.1021\/acs.molpharmaceut.7b00578","article-title":"Comparison of Deep Learning With Multiple Machine Learning Methods and Metrics Using Diverse Drug Discovery Data Sets","volume":"14","author":"A Korotcov","year":"2017","journal-title":"Mol Pharm"},{"key":"pcbi.1009803.ref098","article-title":"The relationship between Precision-Recall and ROC curves","author":"J Davis","year":"2006","journal-title":"Association for Computing Machinery (ACM)."},{"key":"pcbi.1009803.ref099","doi-asserted-by":"crossref","first-page":"e1002683","DOI":"10.1371\/journal.pmed.1002683","article-title":"Variable generalization performance of a deep learning model to detect pneumonia in chest radiographs: A cross-sectional study","volume":"15","author":"JR Zech","year":"2018","journal-title":"PLoS Med"},{"key":"pcbi.1009803.ref100","doi-asserted-by":"crossref","first-page":"831","DOI":"10.1093\/bib\/bbv082","article-title":"Correct machine learning on protein sequences: a peer-reviewing perspective","volume":"17","author":"I Walsh","year":"2016","journal-title":"Brief Bioinform"},{"key":"pcbi.1009803.ref101","first-page":"454","article-title":"Machine Learning to Identify Flexibility Signatures of Class A GPCR Inhibition","volume":"10","author":"J Bemister-Buffington","year":"2020","journal-title":"Biomol Ther."},{"key":"pcbi.1009803.ref102","volume-title":"Methods in Molecular Biology","author":"S Raschka","year":"2018"},{"key":"pcbi.1009803.ref103","doi-asserted-by":"crossref","first-page":"4","DOI":"10.1109\/JBHI.2016.2636665","article-title":"Deep Learning for Health Informatics","volume":"21","author":"D Ravi","year":"2017","journal-title":"IEEE J Biomed Health Inform"},{"key":"pcbi.1009803.ref104","doi-asserted-by":"crossref","first-page":"709","DOI":"10.1038\/s41551-018-0315-x","article-title":"Towards trustable machine learning","volume":"2","year":"2018","journal-title":"Nat Biomed Eng"},{"key":"pcbi.1009803.ref105","unstructured":"Fan F, Xiong J, Li M, Wang G. On Interpretability of Artificial Neural Networks: A Survey. arXiv. 2021 Sep. Report No.: 2001.02522. Available from: https:\/\/arxiv.org\/abs\/2001.02522"},{"key":"pcbi.1009803.ref106","unstructured":"Molnar C. Interpretable Machine Learning. Available from: https:\/\/christophm.github.io\/interpretable-ml-book\/"},{"key":"pcbi.1009803.ref107","doi-asserted-by":"crossref","first-page":"107","DOI":"10.1016\/S0933-3657(96)00367-3","article-title":"An evaluation of machine-learning methods for predicting pneumonia mortality","volume":"9","author":"GF Cooper","year":"1997","journal-title":"Artif Intell Med"},{"key":"pcbi.1009803.ref108","article-title":"Intelligible Models for HealthCare","author":"R Caruana","year":"2015","journal-title":"Association for Computing Machinery (ACM)."},{"key":"pcbi.1009803.ref109","doi-asserted-by":"crossref","first-page":"426","DOI":"10.1038\/s42256-020-0218-x","article-title":"When causal inference meets deep learning","volume":"2","author":"Y Luo","year":"2020","journal-title":"Nat Mach Intell"},{"key":"pcbi.1009803.ref110","doi-asserted-by":"crossref","first-page":"36","DOI":"10.1002\/hast.977","article-title":"Deep Ethical Learning: Taking the Interplay of Human and Artificial Intelligence Seriously","volume":"49","author":"A. Ho","year":"2019","journal-title":"Hastings Cent Rep"},{"key":"pcbi.1009803.ref111","doi-asserted-by":"crossref","first-page":"1139","DOI":"10.1377\/hlthaff.2014.0048","article-title":"The Legal And Ethical Concerns That Arise From Using Complex Predictive Analytics In Health Care","volume":"33","author":"IG Cohen","year":"2014","journal-title":"Health Aff."},{"key":"pcbi.1009803.ref112","article-title":"Model Cards for Model Reporting","author":"M Mitchell","year":"2019","journal-title":"Association for Computing Machinery (ACM)."},{"key":"pcbi.1009803.ref113","unstructured":"American Society for Bioethics and Humanities. [cited 2021 Nov 29]. Available from: https:\/\/asbh.org\/"},{"key":"pcbi.1009803.ref114","unstructured":"10 organizations leading the way in ethical AI\u2014SAGE Ocean | Big Data, New Tech, Social Science. 2021 Jan 12 [cited 2021 Nov 29]. Available from: https:\/\/web.archive.org\/web\/20210112231619\/https:\/\/ocean.sagepub.com\/blog\/10-organizations-leading-the-way-in-ethical-ai"},{"key":"pcbi.1009803.ref115","unstructured":"Artificial Intelligence, Ethics, and Society\u2014Home. [cited 2021 Nov 29]. Available from: https:\/\/www.aies-conference.com\/2021\/"},{"key":"pcbi.1009803.ref116","doi-asserted-by":"crossref","first-page":"e1005399","DOI":"10.1371\/journal.pcbi.1005399","article-title":"Ten simple rules for responsible big data research","volume":"13","author":"M Zook","year":"2017","journal-title":"PLoS Comput Biol"},{"key":"pcbi.1009803.ref117","doi-asserted-by":"crossref","first-page":"615","DOI":"10.1038\/s41576-020-0257-5","article-title":"Responsible, practical genomic data sharing that accelerates research","volume":"21","author":"JB Byrd","year":"2020","journal-title":"Nat Rev Genet"},{"key":"pcbi.1009803.ref118","article-title":"Model Inversion Attacks that Exploit Confidence Information and Basic Countermeasures","author":"M Fredrikson","year":"2015","journal-title":"Association for Computing Machinery (ACM)."},{"key":"pcbi.1009803.ref119","doi-asserted-by":"crossref","unstructured":"Shokri R, Stronati M, Song C, Shmatikov V. Membership Inference Attacks against Machine Learning Models. arXiv. 2017 Apr. Report No.: 1610.05820. Available from: https:\/\/arxiv.org\/abs\/1610.05820","DOI":"10.1109\/SP.2017.41"},{"key":"pcbi.1009803.ref120","unstructured":"Duvenaud D, Maclaurin D, Aguilera-Iparraguirre J, G\u00f3mez-Bombarelli R, Hirzel T, Aspuru-Guzik A, et al. Convolutional Networks on Graphs for Learning Molecular Fingerprints. arXiv. 2015 Nov. Report No.: 1509.09292. Available from: https:\/\/arxiv.org\/abs\/1509.09292"},{"key":"pcbi.1009803.ref121","doi-asserted-by":"crossref","first-page":"e1006454","DOI":"10.1371\/journal.pcbi.1006454","article-title":"SIG-DB: Leveraging homomorphic encryption to securely interrogate privately held genomic databases","volume":"14","author":"AJ Titus","year":"2018","journal-title":"PLoS Comput Biol"},{"key":"pcbi.1009803.ref122","unstructured":"Badawi AA, Chao J, Lin J, Mun CF, Sim JJ, Tan BHM, et al. Towards the AlexNet Moment for Homomorphic Encryption: HCNN, theFirst Homomorphic CNN on Encrypted Data with GPUs. arXiv. 2020 Aug. Report No.: 1811.00778. Available from: https:\/\/arxiv.org\/abs\/1811.00778"},{"key":"pcbi.1009803.ref123","unstructured":"Ryffel T, Trask A, Dahl M, Wagner B, Mancuso J, Rueckert D, et al. A generic framework for privacy preserving deep learning. arXiv. 2018 Nov. Report No.: 1811.04017. Available from: https:\/\/arxiv.org\/abs\/1811.04017"},{"key":"pcbi.1009803.ref124","article-title":"Deep Learning with Differential Privacy","author":"M Abadi","year":"2016","journal-title":"Association for Computing Machinery (ACM)"},{"key":"pcbi.1009803.ref125","article-title":"Privacy-Preserving Generative Deep Neural Networks Support Clinical Data Sharing","volume":"12","author":"BK Beaulieu-Jones","year":"2019","journal-title":"Circ Cardiovasc Qual Outcomes"},{"key":"pcbi.1009803.ref126","unstructured":"Beaulieu-Jones BK, Yuan W, Finlayson SG, Wu ZS. Privacy-Preserving Distributed Deep Learning for Clinical Data. arXiv. 2018 Dec. Report No.: 1812.01484. Available from: https:\/\/arxiv.org\/abs\/1812.01484"},{"key":"pcbi.1009803.ref127","doi-asserted-by":"crossref","first-page":"104716","DOI":"10.1016\/j.compbiomed.2021.104716","article-title":"Privacy preserving distributed learning classifiers\u2013Sequential learning with small sets of data","volume":"136","author":"F Zerka","year":"2021","journal-title":"Comput Biol Med"}],"container-title":["PLOS Computational Biology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1009803","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,3,24]],"date-time":"2022-03-24T21:24:17Z","timestamp":1648157057000},"score":1,"resource":{"primary":{"URL":"https:\/\/dx.plos.org\/10.1371\/journal.pcbi.1009803"}},"subtitle":[],"editor":[{"given":"Francis","family":"Ouellette","sequence":"first","affiliation":[]}],"short-title":[],"issued":{"date-parts":[[2022,3,24]]},"references-count":127,"journal-issue":{"issue":"3","published-online":{"date-parts":[[2022,3,24]]}},"URL":"https:\/\/doi.org\/10.1371\/journal.pcbi.1009803","relation":{},"ISSN":["1553-7358"],"issn-type":[{"value":"1553-7358","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,3,24]]}}}