{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,16]],"date-time":"2026-01-16T08:24:57Z","timestamp":1768551897531,"version":"3.49.0"},"reference-count":51,"publisher":"Oxford University Press (OUP)","issue":"4","license":[{"start":{"date-parts":[[2024,7,10]],"date-time":"2024-07-10T00:00:00Z","timestamp":1720569600000},"content-version":"vor","delay-in-days":48,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"JSPS KAKENHI","award":["21 K06663"],"award-info":[{"award-number":["21 K06663"]}]},{"DOI":"10.13039\/501100001691","name":"Japan Society for the Promotion of Science","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001691","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100007449","name":"Takeda Science Foundation","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100007449","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100005865","name":"Mochida Memorial Foundation for Medical and Pharmaceutical Research","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100005865","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,5,23]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:p>Inferring cell type proportions from bulk transcriptome data is crucial in immunology and oncology. Here, we introduce guided LDA deconvolution (GLDADec), a bulk deconvolution method that guides topics using cell type-specific marker gene names to estimate topic distributions for each sample. Through benchmarking using blood-derived datasets, we demonstrate its high estimation performance and robustness. Moreover, we apply GLDADec to heterogeneous tissue bulk data and perform comprehensive cell type analysis in a data-driven manner. We show that GLDADec outperforms existing methods in estimation performance and evaluate its biological interpretability by examining enrichment of biological processes for topics. Finally, we apply GLDADec to The Cancer Genome Atlas tumor samples, enabling subtype stratification and survival analysis based on estimated cell type proportions, thus proving its practical utility in clinical settings. This approach, utilizing marker gene names as partial prior information, can be applied to various scenarios for bulk data deconvolution. GLDADec is available as an open-source Python package at https:\/\/github.com\/mizuno-group\/GLDADec.<\/jats:p>","DOI":"10.1093\/bib\/bbae315","type":"journal-article","created":{"date-parts":[[2024,7,10]],"date-time":"2024-07-10T00:16:26Z","timestamp":1720570586000},"source":"Crossref","is-referenced-by-count":5,"title":["GLDADec: marker-gene guided LDA modeling for bulk gene expression deconvolution"],"prefix":"10.1093","volume":"25","author":[{"given":"Iori","family":"Azuma","sequence":"first","affiliation":[{"name":"Graduate School of Pharmaceutical Sciences, The University of Tokyo , 7-3-1, Bunkyo-ku 113-0033 , Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1638-602X","authenticated-orcid":false,"given":"Tadahaya","family":"Mizuno","sequence":"additional","affiliation":[{"name":"Graduate School of Pharmaceutical Sciences, The University of Tokyo , 7-3-1, Bunkyo-ku 113-0033 , Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hiroyuki","family":"Kusuhara","sequence":"additional","affiliation":[{"name":"Graduate School of Pharmaceutical Sciences, The University of Tokyo , 7-3-1, Bunkyo-ku 113-0033 , Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"286","published-online":{"date-parts":[[2024,7,10]]},"reference":[{"key":"2024071000155438900_ref1","doi-asserted-by":"crossref","first-page":"474","DOI":"10.1056\/NEJMra021844","article-title":"Drug-induced hepatotoxicity","volume":"349","author":"Lee","year":"2003","journal-title":"N Engl J Med"},{"key":"2024071000155438900_ref2","doi-asserted-by":"crossref","first-page":"884","DOI":"10.1016\/j.devcel.2010.05.012","article-title":"Tumors as organs: complex tissues that Interface with the entire organism","volume":"18","author":"Egeblad","year":"2010","journal-title":"Dev Cell"},{"key":"2024071000155438900_ref3","first-page":"93","article-title":"The gene expression omnibus","author":"Clough","year":"2016","journal-title":"Database"},{"key":"2024071000155438900_ref4","doi-asserted-by":"crossref","first-page":"580","DOI":"10.1038\/ng.2653","article-title":"The genotype-tissue expression (GTEx) project","volume":"45","author":"Lonsdale","year":"2013","journal-title":"Nat Genet"},{"key":"2024071000155438900_ref5","doi-asserted-by":"crossref","first-page":"1366","DOI":"10.1038\/s41467-018-03751-6","article-title":"Massive mining of publicly available RNA-seq data from human and mouse","volume":"9","author":"Lachmann","year":"2018","journal-title":"Nat Commun"},{"key":"2024071000155438900_ref6","doi-asserted-by":"crossref","first-page":"41","DOI":"10.1038\/nmeth.2694","article-title":"Quantitative assessment of single-cell RNA-sequencing methods","volume":"11","author":"Wu","year":"2014","journal-title":"Nat Methods"},{"key":"2024071000155438900_ref7","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pcbi.1006976","article-title":"Fast and robust deconvolution of tumor infiltrating lymphocyte from expression profiles using least trimmed squares","volume":"15","author":"Hao","year":"2019","journal-title":"PLoS Comput Biol"},{"key":"2024071000155438900_ref8","doi-asserted-by":"crossref","first-page":"6","DOI":"10.7554\/eLife.26476","article-title":"Simultaneous enumeration of cancer and immune cell types from bulk tumor gene expression data","volume":"6","author":"Racle","year":"2017","journal-title":"Elife"},{"key":"2024071000155438900_ref9","doi-asserted-by":"crossref","first-page":"135","DOI":"10.1007\/978-1-0716-0301-7_7","article-title":"Profiling cell type abundance and expression in bulk tissues with CIBERSORTx","volume":"2117","author":"Steen","year":"2020","journal-title":"Methods Mol Biol"},{"key":"2024071000155438900_ref10","doi-asserted-by":"crossref","first-page":"720","DOI":"10.1002\/msb.134947","article-title":"Digital cell quantification identifies global immune cell dynamics during influenza infection","volume":"10","author":"Altboum","year":"2014","journal-title":"Mol Syst Biol"},{"key":"2024071000155438900_ref11","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pcbi.1008452","article-title":"Deconvolution of heterogeneous tumor samples using partial reference signals","volume":"16","author":"Qin","year":"2020","journal-title":"PLoS Comput Biol"},{"key":"2024071000155438900_ref12","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pcbi.1007510","article-title":"CDSeq: a novel complete deconvolution method for dissecting heterogeneous samples using gene expression data","volume":"15","author":"Kang","year":"2019","journal-title":"PLoS Comput Biol"},{"key":"2024071000155438900_ref13","doi-asserted-by":"crossref","first-page":"453","DOI":"10.1038\/nmeth.3337","article-title":"Robust enumeration of cell subsets from tissue expression profiles","volume":"12","author":"Newman","year":"2015","journal-title":"Nat Methods"},{"key":"2024071000155438900_ref14","doi-asserted-by":"crossref","first-page":"505","DOI":"10.1038\/s43018-022-00356-3","article-title":"Cell type and gene expression deconvolution with BayesPrism enables Bayesian integrative analysis across bulk and single-cell RNA sequencing in oncology","volume":"3","author":"Chu","year":"2022","journal-title":"Nat Cancer"},{"key":"2024071000155438900_ref15","doi-asserted-by":"crossref","DOI":"10.1093\/bib\/bbaa358","article-title":"Progress and challenge for computational quantification of tissue immune cells","volume":"22","author":"Chen","year":"2021","journal-title":"Brief Bioinform"},{"key":"2024071000155438900_ref16","doi-asserted-by":"crossref","first-page":"R216","DOI":"10.1093\/hmg\/ddx275","article-title":"Cell-type deconvolution from DNA methylation: a review of recent applications","volume":"26","author":"Titus","year":"2017","journal-title":"Hum Mol Genet"},{"key":"2024071000155438900_ref17","doi-asserted-by":"crossref","first-page":"lqad111","DOI":"10.1093\/nargab\/lqad111","article-title":"Investigation of the usefulness of liver-specific deconvolution method by establishing a liver benchmark dataset","volume":"6","author":"Azuma","year":"2024","journal-title":"NAR Genom Bioinform"},{"key":"2024071000155438900_ref18","first-page":"993","article-title":"Latent dirichlet\u00a0allocation","volume":"3","author":"Blei","year":"2003","journal-title":"J Mach Learn Res"},{"key":"2024071000155438900_ref19","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3462478","article-title":"Topic modeling using latent Dirichlet\u00a0allocation","volume":"54","author":"Chauhan","year":"2022","journal-title":"ACM Comput Surv"},{"key":"2024071000155438900_ref20","doi-asserted-by":"crossref","first-page":"190","DOI":"10.1186\/s13059-023-03034-4","article-title":"GTM-decon: guided-topic modeling of single-cell transcriptomes enables sub-cell-type and disease-subtype deconvolution of bulk transcriptomes","volume":"24","author":"Swapna","year":"2023","journal-title":"Genome Biol"},{"key":"2024071000155438900_ref21","doi-asserted-by":"crossref","first-page":"5228","DOI":"10.1073\/pnas.0307752101","article-title":"Finding scientific topics","volume":"101","author":"Griffiths","year":"2004","journal-title":"Proc Natl Acad Sci"},{"key":"2024071000155438900_ref22","doi-asserted-by":"crossref","first-page":"224","DOI":"10.1177\/08944393231178605","article-title":"Seeded sequential LDA: a semi-supervised algorithm for topic-specific analysis of sentences","volume":"42","author":"Watanabe","year":"2023","journal-title":"Soc Sci Comput Rev"},{"key":"2024071000155438900_ref23","doi-asserted-by":"crossref","first-page":"465","DOI":"10.1177\/01655515211007724","article-title":"A guided latent Dirichlet\u00a0allocation approach to investigate real-time latent topics of twitter data during hurricane Laura","volume":"49","author":"Zhou","year":"2023","journal-title":"J Inf Sci"},{"key":"2024071000155438900_ref24","doi-asserted-by":"crossref","first-page":"25","DOI":"10.1038\/75556","article-title":"Gene ontology: tool for the unification of biology","volume":"25","author":"Ashburner","year":"2000","journal-title":"Nat Genet"},{"key":"2024071000155438900_ref25","doi-asserted-by":"crossref","first-page":"27","DOI":"10.1093\/nar\/28.1.27","article-title":"KEGG: Kyoto Encyclopedia of genes and genomes","volume":"28","author":"Kanehisa","year":"2000","journal-title":"Nucleic Acids Res"},{"key":"2024071000155438900_ref26","doi-asserted-by":"crossref","first-page":"380","DOI":"10.1038\/s41467-018-08023-x","article-title":"Bulk tissue cell type deconvolution with multi-subject single-cell expression reference","volume":"10","author":"Wang","year":"2019","journal-title":"Nat Commun"},{"key":"2024071000155438900_ref27","doi-asserted-by":"crossref","first-page":"346","DOI":"10.1016\/j.cels.2016.08.011","article-title":"A single-cell transcriptomic map of the human and mouse pancreas reveals inter- and intra-cell population structure","volume":"3","author":"Baron","year":"2016","journal-title":"Cell Syst"},{"key":"2024071000155438900_ref28","doi-asserted-by":"crossref","first-page":"34","DOI":"10.1186\/s13073-019-0638-6","article-title":"Molecular and pharmacological modulators of the tumor immune contexture revealed by deconvolution of RNA-seq data","volume":"11","author":"Finotello","year":"2019","journal-title":"Genome Med"},{"key":"2024071000155438900_ref29","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pone.0109760","article-title":"Copy number loss of the interferon gene cluster in melanomas is linked to reduced T cell infiltrate and poor patient prognosis","volume":"9","author":"Linsley","year":"2014","journal-title":"PloS One"},{"key":"2024071000155438900_ref30","doi-asserted-by":"crossref","first-page":"1627","DOI":"10.1016\/j.celrep.2019.01.041","article-title":"RNA-Seq signatures normalized by mRNA abundance allow absolute deconvolution of human immune cell types","volume":"26","author":"Monaco","year":"2019","journal-title":"Cell Rep"},{"key":"2024071000155438900_ref31","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pone.0152034","article-title":"System-wide associations between DNA-methylation, gene expression, and humoral immune response to influenza vaccination","volume":"11","author":"Zimmermann","year":"2016","journal-title":"PloS One"},{"key":"2024071000155438900_ref32","doi-asserted-by":"crossref","first-page":"D870","DOI":"10.1093\/nar\/gkac947","article-title":"CellMarker 2.0: an updated database of manually curated cell markers in human\/mouse and web tools based on scRNA-seq data","volume":"51","author":"Hu","year":"2023","journal-title":"Nucleic Acids Res"},{"key":"2024071000155438900_ref33","doi-asserted-by":"crossref","DOI":"10.1093\/database\/baz046","article-title":"PanglaoDB: a web server for exploration of mouse and human single-cell RNA sequencing data","volume":"2019","author":"Franz\u00e9n","year":"2019","journal-title":"Database"},{"key":"2024071000155438900_ref34","doi-asserted-by":"crossref","first-page":"D921","DOI":"10.1093\/nar\/gku955","article-title":"Open TG-GATEs: a large-scale toxicogenomics database","volume":"43","author":"Igarashi","year":"2015","journal-title":"Nucleic Acids Res"},{"key":"2024071000155438900_ref35","article-title":"Rat deconvolution as knowledge miner for immune cell trafficking from toxicogenomics databases","volume":"197","author":"Morita","year":"2023","journal-title":"Toxicol Sci"},{"key":"2024071000155438900_ref36","doi-asserted-by":"crossref","first-page":"855","DOI":"10.4049\/immunohorizons.2100088","article-title":"Type I IFN\u2013driven immune cell dysregulation in rat autoimmune diabetes","volume":"5","author":"Qaisar","year":"2021","journal-title":"Immunohorizons"},{"key":"2024071000155438900_ref37","doi-asserted-by":"crossref","first-page":"374","DOI":"10.1016\/j.ccell.2023.02.016","article-title":"The evolving tumor microenvironment: from cancer initiation to metastatic outgrowth","volume":"41","author":"Visser","year":"2023","journal-title":"Cancer Cell"},{"key":"2024071000155438900_ref38","doi-asserted-by":"crossref","first-page":"1113","DOI":"10.1038\/ng.2764","article-title":"The cancer genome atlas pan-cancer analysis project","volume":"45","author":"Weinstein","year":"2013","journal-title":"Nat Genet"},{"key":"2024071000155438900_ref39","doi-asserted-by":"crossref","first-page":"690","DOI":"10.1016\/j.ccell.2018.03.014","article-title":"A comprehensive pan-cancer molecular study of gynecologic and breast cancers","volume":"33","author":"Berger","year":"2018","journal-title":"Cancer Cell"},{"key":"2024071000155438900_ref40","doi-asserted-by":"crossref","first-page":"607","DOI":"10.1038\/ng.3564","article-title":"Distinct patterns of somatic genome alterations in lung adenocarcinomas and squamous cell carcinomas","volume":"48","author":"Campbell","year":"2016","journal-title":"Nat Genet"},{"key":"2024071000155438900_ref41","doi-asserted-by":"crossref","first-page":"1327","DOI":"10.1016\/j.cell.2017.05.046","article-title":"Comprehensive and integrative genomic characterization of hepatocellular carcinoma","volume":"169","author":"Ally","year":"2017","journal-title":"Cell"},{"key":"2024071000155438900_ref42","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pone.0157368","article-title":"Refinement of triple-negative breast cancer molecular subtypes: implications for Neoadjuvant chemotherapy selection","volume":"11","author":"Lehmann","year":"2016","journal-title":"PloS One"},{"key":"2024071000155438900_ref43","doi-asserted-by":"crossref","first-page":"1098","DOI":"10.1186\/s12885-021-08805-5","article-title":"A novel gene expression signature-based on B-cell proportion to predict prognosis of patients with lung adenocarcinoma","volume":"21","author":"Zhang","year":"2021","journal-title":"BMC Cancer"},{"key":"2024071000155438900_ref44","first-page":"11","article-title":"KPNA2-associated immune analyses highlight the dysregulation and prognostic effects of GRB2, NRAS, and their RNA-binding proteins in hepatocellular carcinoma","volume":"11","author":"Zhang","year":"2020","journal-title":"Front Genet"},{"key":"2024071000155438900_ref45","first-page":"e1284723","article-title":"Assessment of tumor-infiltrating TCRV \u03b39V\u03b42\u03b3\u03b4 lymphocyte abundance by deconvolution of human cancers microarrays","volume":"6","author":"Tosolini","year":"2017","journal-title":"Onco Targets Ther"},{"key":"2024071000155438900_ref46","doi-asserted-by":"crossref","first-page":"12","DOI":"10.3389\/fimmu.2021.666137","article-title":"Construction and validation of an immune infiltration-related gene signature for the prediction of prognosis and therapeutic response in breast cancer","volume":"12","author":"Peng","year":"2021","journal-title":"Front Immunol"},{"key":"2024071000155438900_ref47","doi-asserted-by":"crossref","DOI":"10.1016\/j.infsof.2020.106411","article-title":"A systematic comparison of search-based approaches for LDA hyperparameter tuning","volume":"130","author":"Panichella","year":"2021","journal-title":"Inf Softw Technol"},{"key":"2024071000155438900_ref48","doi-asserted-by":"crossref","first-page":"5133","DOI":"10.1007\/s10462-022-10254-w","article-title":"Short text topic modelling approaches in the context of big data: taxonomy, survey, and analysis","volume":"56","author":"Murshed","year":"2023","journal-title":"Artif Intell Rev"},{"key":"2024071000155438900_ref49","doi-asserted-by":"crossref","DOI":"10.1016\/j.is.2020.101582","article-title":"A review of topic modeling methods","volume":"94","author":"Vayansky","year":"2020","journal-title":"Inf Syst"},{"key":"2024071000155438900_ref50","doi-asserted-by":"crossref","first-page":"2285","DOI":"10.1038\/s41467-020-16164-1","article-title":"Single-cell RNA sequencing demonstrates the molecular and cellular reprogramming of metastatic lung adenocarcinoma","volume":"11","author":"Kim","year":"2020","journal-title":"Nat Commun"},{"key":"2024071000155438900_ref51","doi-asserted-by":"crossref","first-page":"456","DOI":"10.1002\/hep.32609","article-title":"Eosinophils protect against acetaminophen-induced liver injury through cyclooxygenase-mediated IL-4\/IL-13 production","volume":"77","author":"Xu","year":"2023","journal-title":"Hepatology"}],"container-title":["Briefings in Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/bib\/article-pdf\/25\/4\/bbae315\/58479724\/bbae315.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/bib\/article-pdf\/25\/4\/bbae315\/58479724\/bbae315.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,7,10]],"date-time":"2024-07-10T00:17:03Z","timestamp":1720570623000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/bib\/article\/doi\/10.1093\/bib\/bbae315\/7709575"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,5,23]]},"references-count":51,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2024,5,23]]}},"URL":"https:\/\/doi.org\/10.1093\/bib\/bbae315","relation":{},"ISSN":["1467-5463","1477-4054"],"issn-type":[{"value":"1467-5463","type":"print"},{"value":"1477-4054","type":"electronic"}],"subject":[],"published-other":{"date-parts":[[2024,7]]},"published":{"date-parts":[[2024,5,23]]},"article-number":"bbae315"}}