{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,29]],"date-time":"2026-03-29T05:00:58Z","timestamp":1774760458858,"version":"3.50.1"},"reference-count":28,"publisher":"Oxford University Press (OUP)","issue":"3","license":[{"start":{"date-parts":[[2023,3,22]],"date-time":"2023-03-22T00:00:00Z","timestamp":1679443200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/academic.oup.com\/journals\/pages\/open_access\/funder_policies\/chorus\/standard_publication_model"}],"funder":[{"name":"Ministry of Research"},{"name":"Universit\u00e9 Paris Cit\u00e9"},{"DOI":"10.13039\/501100000272","name":"National Institute for Health and Medical Research","doi-asserted-by":"crossref","award":["ANR-18-IDEX-0001"],"award-info":[{"award-number":["ANR-18-IDEX-0001"]}],"id":[{"id":"10.13039\/501100000272","id-type":"DOI","asserted-by":"crossref"}]},{"name":"Laboratory of Excellence GR-Ex","award":["ANR-11-LABX-0051"],"award-info":[{"award-number":["ANR-11-LABX-0051"]}]},{"name":"Laboratory of Excellence GR-Ex","award":["ANR-11-IDEX-0005-02"],"award-info":[{"award-number":["ANR-11-IDEX-0005-02"]}]},{"DOI":"10.13039\/501100001665","name":"French National Research Agency","doi-asserted-by":"publisher","award":["ANR-21-CE45-0019"],"award-info":[{"award-number":["ANR-21-CE45-0019"]}],"id":[{"id":"10.13039\/501100001665","id-type":"DOI","asserted-by":"publisher"}]},{"name":"High Performance Computing"},{"name":"Institut du D\u00e9veloppement et Des Ressources en Informatique Scientifique, France","award":["A0050710640"],"award-info":[{"award-number":["A0050710640"]}]},{"name":"Institut du D\u00e9veloppement et Des Ressources en Informatique Scientifique, France","award":["A0010710172"],"award-info":[{"award-number":["A0010710172"]}]},{"name":"Tr\u00e8s Grand Centre de Calcul","award":["A0090712053"],"award-info":[{"award-number":["A0090712053"]}]},{"name":"Tr\u00e8s Grand Centre de Calcul","award":["A0110712053"],"award-info":[{"award-number":["A0110712053"]}]},{"name":"Grand Equipement National de Calcul Intensif, France"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,5,19]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:p>In the era of constantly increasing amounts of the available protein data, a relevant and interpretable visualization becomes crucial, especially for tasks requiring human expertise. Poincar\u00e9 disk projection has previously demonstrated its important efficiency for visualization of biological data such as single-cell RNAseq data. Here, we develop a new method Poincar\u00e9MSA for visual representation of complex relationships between protein sequences based on Poincar\u00e9 maps embedding. We demonstrate its efficiency and potential for visualization of protein family topology as well as evolutionary and functional annotation of uncharacterized sequences. Poincar\u00e9MSA is implemented in open source Python code with available interactive Google Colab notebooks as described at https:\/\/www.dsimb.inserm.fr\/POINCARE_MSA.<\/jats:p>","DOI":"10.1093\/bib\/bbad103","type":"journal-article","created":{"date-parts":[[2023,3,22]],"date-time":"2023-03-22T11:49:47Z","timestamp":1679485787000},"source":"Crossref","is-referenced-by-count":6,"title":["Poincar\u00e9 maps for visualization of large protein families"],"prefix":"10.1093","volume":"24","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-1057-6690","authenticated-orcid":false,"given":"Anna Klimovskaia","family":"Susmelj","sequence":"first","affiliation":[{"name":"Swiss Data Science Center, ETH Zurich and EPFL , Zurich , Switzerland"},{"name":"Biognosys AG , Wagistrasse 21, 8952 Schlieren , Switzerland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yani","family":"Ren","sequence":"additional","affiliation":[{"name":"Universit\u00e9 Paris Cit\u00e9 and Universit\u00e9 des Antilles and Universit\u00e9 de la R\u00e9union, INSERM, BIGR , F-75014 Paris , France"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6680-8104","authenticated-orcid":false,"given":"Yann","family":"Vander Meersche","sequence":"additional","affiliation":[{"name":"Universit\u00e9 Paris Cit\u00e9 and Universit\u00e9 des Antilles and Universit\u00e9 de la R\u00e9union, INSERM, BIGR , F-75014 Paris , France"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5138-361X","authenticated-orcid":false,"given":"Jean-Christophe","family":"Gelly","sequence":"additional","affiliation":[{"name":"Universit\u00e9 Paris Cit\u00e9 and Universit\u00e9 des Antilles and Universit\u00e9 de la R\u00e9union, INSERM, BIGR , F-75014 Paris , France"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3608-5208","authenticated-orcid":false,"given":"Tatiana","family":"Galochkina","sequence":"additional","affiliation":[{"name":"Universit\u00e9 Paris Cit\u00e9 and Universit\u00e9 des Antilles and Universit\u00e9 de la R\u00e9union, INSERM, BIGR , F-75014 Paris , France"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"286","published-online":{"date-parts":[[2023,3,22]]},"reference":[{"key":"2023052021590901000_ref1","volume-title":"Xfam Blog","author":"Pfam 34.0 is released","year":"2021"},{"key":"2023052021590901000_ref2","doi-asserted-by":"crossref","first-page":"932","DOI":"10.1038\/s41587-021-01179-w","article-title":"Using deep learning to annotate the protein universe","volume":"40","author":"Bileschi","year":"2022","journal-title":"Nat Biotechnol"},{"key":"2023052021590901000_ref3","first-page":"2579","article-title":"Visualizing data using t-SNE","volume":"9","author":"Maaten","year":"2008","journal-title":"J Machine Learning Res"},{"key":"2023052021590901000_ref4","doi-asserted-by":"crossref","first-page":"861","DOI":"10.21105\/joss.00861","article-title":"UMAP: uniform manifold approximation and projection","volume":"3","author":"McInnes","year":"2018","journal-title":"J Open Source Softw"},{"key":"2023052021590901000_ref5","volume-title":"Metric Structures for Riemannian and Non-Riemannian Spaces","author":"Gromov","year":"2007"},{"key":"2023052021590901000_ref6","doi-asserted-by":"crossref","first-page":"2966","DOI":"10.1038\/s41467-020-16822-4","article-title":"Poincar\u00e9 maps for analyzing complex hierarchies in single-cell data","volume":"11","author":"Klimovskaia","year":"2020","journal-title":"Nat Commun"},{"key":"2023052021590901000_ref7","doi-asserted-by":"crossref","first-page":"bpab006","DOI":"10.1093\/biomethods\/bpab006","article-title":"Novel metric for hyperbolic phylogenetic tree embeddings","volume":"6","author":"Matsumoto","year":"2021","journal-title":"Biol Methods Protoc"},{"key":"2023052021590901000_ref8","doi-asserted-by":"crossref","first-page":"574","DOI":"10.1016\/0022-2836(94)90032-9","article-title":"Position-based sequence weights","volume":"243","author":"Henikoff","year":"1994","journal-title":"J Mol Biol"},{"key":"2023052021590901000_ref9","doi-asserted-by":"crossref","first-page":"135","DOI":"10.1093\/bioinformatics\/12.2.135","article-title":"Using substitution probabilities to improve position-specific scoring matrices","volume":"12","author":"Henikoff","year":"1996","journal-title":"Bioinformatics"},{"key":"2023052021590901000_ref10","doi-asserted-by":"crossref","first-page":"203D","DOI":"10.1093\/nar\/gkh027","article-title":"HOMSTRAD: recent developments of the homologous protein structure alignment database","volume":"32","author":"Stebbings","year":"2004","journal-title":"Nucleic Acids Res"},{"key":"2023052021590901000_ref11","doi-asserted-by":"crossref","first-page":"2856","DOI":"10.1093\/bioinformatics\/bty1057","article-title":"MMseqs2 desktop and local web server app for fast, interactive sequence searches","volume":"35","author":"Mirdita","year":"2019","journal-title":"Bioinformatics"},{"key":"2023052021590901000_ref12","doi-asserted-by":"crossref","first-page":"1026","DOI":"10.1038\/nbt.3988","article-title":"MMseqs2 enables sensitive protein sequence searching for the analysis of massive data sets","volume":"35","author":"Steinegger","year":"2017","journal-title":"Nat Biotechnol"},{"key":"2023052021590901000_ref13","doi-asserted-by":"crossref","first-page":"3029","DOI":"10.1093\/bioinformatics\/btab184","article-title":"Fast and sensitive taxonomic assignment to metagenomic contigs","volume":"37","author":"Mirdita","year":"2021","journal-title":"Bioinformatics"},{"key":"2023052021590901000_ref14","doi-asserted-by":"crossref","first-page":"473","DOI":"10.1186\/s12859-019-3019-7","article-title":"HH-suite3 for fast remote homology detection and deep protein annotation","volume":"20","author":"Steinegger","year":"2019","journal-title":"BMC Bioinformatics"},{"key":"2023052021590901000_ref15","doi-asserted-by":"crossref","first-page":"173","DOI":"10.1038\/nmeth.1818","article-title":"HHblits: lightning-fast iterative protein sequence searching by HMM-HMM alignment","volume":"9","author":"Remmert","year":"2012","journal-title":"Nat Methods"},{"key":"2023052021590901000_ref16","doi-asserted-by":"crossref","first-page":"D12","DOI":"10.1093\/nar\/gkw1071","article-title":"Database Resources of the National Center for Biotechnology information","volume":"45","author":"NCBI Resource Coordinators","year":"2017","journal-title":"Nucleic Acids Res"},{"key":"2023052021590901000_ref17","doi-asserted-by":"crossref","first-page":"2248","DOI":"10.1016\/j.patrec.2010.04.013","article-title":"Scale-independent quality criteria for dimensionality reduction","volume":"31","author":"Lee","year":"2010","journal-title":"Pattern Recognit Lett"},{"key":"2023052021590901000_ref18","doi-asserted-by":"crossref","first-page":"31","DOI":"10.1186\/1471-2148-6-31","article-title":"A phylogenomic profile of globins","volume":"6","author":"Vinogradov","year":"2006","journal-title":"BMC Evol Biol"},{"key":"2023052021590901000_ref19","doi-asserted-by":"crossref","DOI":"10.1016\/j.redox.2020.101687","article-title":"Lessons from the post-genomic era: globin diversity beyond oxygen binding and transport","volume":"37","author":"Keppner","year":"2020","journal-title":"Redox Biol"},{"key":"2023052021590901000_ref20","doi-asserted-by":"crossref","first-page":"D506","DOI":"10.1093\/nar\/gky1049","article-title":"UniProt: a worldwide hub of protein knowledge","volume":"47","author":"The UniProt Consortium","year":"2019","journal-title":"Nucleic Acids Res"},{"key":"2023052021590901000_ref21","doi-asserted-by":"crossref","first-page":"592","DOI":"10.1038\/nsmb.2020","article-title":"Single-molecule paleoenzymology probes the chemistry of resurrected enzymes","volume":"18","author":"Perez-Jimenez","year":"2011","journal-title":"Nat Struct Mol Biol"},{"key":"2023052021590901000_ref22","doi-asserted-by":"crossref","first-page":"890","DOI":"10.1038\/nsmb.1627","article-title":"Diversity of chemical mechanisms in thioredoxin catalysis revealed by single-molecule force spectroscopy","volume":"16","author":"Perez-Jimenez","year":"2009","journal-title":"Nat Struct Mol Biol"},{"key":"2023052021590901000_ref23","doi-asserted-by":"crossref","first-page":"1912","DOI":"10.1126\/science.1075762","article-title":"The protein kinase complement of the human genome","volume":"298","author":"Manning","year":"2002","journal-title":"Science"},{"key":"2023052021590901000_ref24","doi-asserted-by":"crossref","first-page":"19790","DOI":"10.1038\/s41598-019-56499-4","article-title":"A structurally-validated multiple sequence alignment of 497 human protein kinase domains","volume":"9","author":"Modi","year":"2019","journal-title":"Sci Rep"},{"key":"2023052021590901000_ref25","doi-asserted-by":"crossref","first-page":"2619","DOI":"10.1098\/rstb.2012.0003","article-title":"Diversity, classification and function of the plant protein kinase superfamily","volume":"367","author":"Lehti-Shiu","year":"2012","journal-title":"Philos Trans R Soc B Biol Sci"},{"key":"2023052021590901000_ref26","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pone.0001076","article-title":"Phylogenetic analysis of the Neks reveals early diversification of ciliary-cell cycle kinases","volume":"2","author":"Parker","year":"2007","journal-title":"PloS One"},{"key":"2023052021590901000_ref27","doi-asserted-by":"crossref","first-page":"5644","DOI":"10.1038\/s41467-019-13633-0","article-title":"Deciphering protein evolution and fitness landscapes with latent space models","volume":"10","author":"Ding","year":"2019","journal-title":"Nat Commun"},{"key":"2023052021590901000_ref28","doi-asserted-by":"crossref","first-page":"1914","DOI":"10.1038\/s41467-022-29443-w","article-title":"Learning meaningful representations of protein sequences","volume":"13","author":"Detlefsen","year":"2022","journal-title":"Nat Commun"}],"container-title":["Briefings in Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bib\/article-pdf\/24\/3\/bbad103\/50410393\/bbad103.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bib\/article-pdf\/24\/3\/bbad103\/50410393\/bbad103.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,5,20]],"date-time":"2023-05-20T21:59:46Z","timestamp":1684619986000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bib\/article\/doi\/10.1093\/bib\/bbad103\/7083418"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,3,22]]},"references-count":28,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2023,5,19]]}},"URL":"https:\/\/doi.org\/10.1093\/bib\/bbad103","relation":{},"ISSN":["1467-5463","1477-4054"],"issn-type":[{"value":"1467-5463","type":"print"},{"value":"1477-4054","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2023,5]]},"published":{"date-parts":[[2023,3,22]]},"article-number":"bbad103"}}