{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T04:14:28Z","timestamp":1777868068440,"version":"3.51.4"},"reference-count":43,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T00:00:00Z","timestamp":1777507200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T00:00:00Z","timestamp":1777507200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"funder":[{"DOI":"10.13039\/501100020771","name":"Young Scientists Fund of the National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["62507006"],"award-info":[{"award-number":["62507006"]}],"id":[{"id":"10.13039\/501100020771","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Cogn Comput"],"published-print":{"date-parts":[[2026,12]]},"DOI":"10.1007\/s12559-026-10577-8","type":"journal-article","created":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T11:24:11Z","timestamp":1777548251000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["MixingInsights: A Framework for Causal Inference with Confounder Representation Learning from Mixed Structured and Textual Data"],"prefix":"10.1007","volume":"18","author":[{"given":"Lu","family":"Feng","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Adi","family":"Lin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhiyong","family":"Luo","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,4,30]]},"reference":[{"key":"10577_CR1","doi-asserted-by":"crossref","unstructured":"Ai M, Li B, Gong H, Yu Q, Xue S, Zhang Y, et\u00a0al. LBCF: A Large-Scale Budget-Constrained Causal Forest Algorithm. In: Proceedings of the ACM Web Conference 2022; 2022. p. 2310\u20139.","DOI":"10.1145\/3485447.3512103"},{"key":"10577_CR2","doi-asserted-by":"publisher","first-page":"3359","DOI":"10.1145\/3442381.3449845","volume-title":"WWW\u201921: The Web Conference 2021","author":"Y Yuan","year":"2021","unstructured":"Yuan Y, Altenburger KM, Kooti F. Causal Network Motifs: Identifying Heterogeneous Spillover Effects in A\/B Tests. In: Leskovec J, Grobelnik M, Najork M, Tang J, Zia L, editors. WWW\u201921: The Web Conference 2021. Virtual Event \/ Ljubljana, Slovenia, April 19\u201323(2021); 2021. p. 3359\u201370."},{"key":"10577_CR3","doi-asserted-by":"publisher","first-page":"2291","DOI":"10.1145\/3442381.3449982","volume-title":"WWW\u201921: The Web Conference 2021","author":"Y Li","year":"2021","unstructured":"Li Y, Xie H, Lin Y, Lui JCS. Unifying Offline Causal Inference and Online Bandit Learning for Data Driven Decision. In: Leskovec J, Grobelnik M, Najork M, Tang J, Zia L, editors. WWW\u201921: The Web Conference 2021. Virtual Event \/ Ljubljana, Slovenia, April 19\u201323(2021); 2021. p. 2291\u2013303."},{"key":"10577_CR4","doi-asserted-by":"crossref","unstructured":"Chandar P, St\u00a0Thomas B, Maystre L, Pappu V, Sanchis-Ojeda R, Wu T, et\u00a0al. Using Survival Models to Estimate User Engagement in Online Experiments. In: Proceedings of the ACM Web Conference 2022; 2022. p. 3186\u201395.","DOI":"10.1145\/3485447.3512038"},{"key":"10577_CR5","doi-asserted-by":"publisher","first-page":"65","DOI":"10.1016\/j.jairtraman.2019.04.001","volume":"77","author":"E Sezgen","year":"2019","unstructured":"Sezgen E, Mason KJ, Mayer R. Voice of airline passenger: A text mining approach to understand customer satisfaction. J Air Trans Manag. 2019;77:65\u201374.","journal-title":"J Air Trans Manag"},{"key":"10577_CR6","doi-asserted-by":"crossref","unstructured":"Keith KA, Jensen D, O\u2019Connor B. Text and causal inference: A review of using text to remove confounding from causal estimates. In: Jurafsky D, Chai J, Schluter N, Tetreault JR, editors. Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5-10, 2020; 2020. p. 5332\u201344.","DOI":"10.18653\/v1\/2020.acl-main.474"},{"key":"10577_CR7","doi-asserted-by":"crossref","unstructured":"Sridhar D, Getoor L. Estimating Causal Effects of Tone in Online Debates. In: Kraus S, editor. Proceedings of the Twenty-Eighth International Joint Conference on Artificial Intelligence, IJCAI 2019, Macao, China, August 10-16, 2019; 2019. p. 1872\u201378.","DOI":"10.24963\/ijcai.2019\/259"},{"key":"10577_CR8","doi-asserted-by":"crossref","unstructured":"Saha K, Sugar B, Torous J, Abrahao B, K\u0131c\u0131man E, De\u00a0Choudhury M. A social media study on the effects of psychiatric medication use. In: Proceedings of the International AAAI Conference on Web and Social Media. vol.\u00a013; 2019. p. 440\u201351.","DOI":"10.1609\/icwsm.v13i01.3242"},{"key":"10577_CR9","first-page":"135983","volume-title":"Advances in Neural Information Processing Systems","author":"JM Chen","year":"2024","unstructured":"Chen JM, Bhattacharya R, Keith KA, et al. Proximal Causal Inference With Text Data. In: Globerson A, Mackey L, Belgrave D, Fan A, Paquet U, Tomczak J, et al., editors. Advances in Neural Information Processing Systems, vol. 37. Curran Associates: Inc; 2024. p. 135983\u20136017."},{"key":"10577_CR10","doi-asserted-by":"crossref","unstructured":"De\u00a0Choudhury M, Kiciman E, Dredze M, Coppersmith G, Kumar M. Discovering shifts to suicidal ideation from mental health content in social media. In: Proceedings of the 2016 CHI conference on human factors in computing systems; 2016. p. 2098\u2013110.","DOI":"10.1145\/2858036.2858207"},{"key":"10577_CR11","doi-asserted-by":"crossref","unstructured":"De\u00a0Choudhury M, Kiciman E. The language of social support in social media and its effect on suicidal ideation risk. In: Proceedings of the International AAAI Conference on Web and Social Media. vol.\u00a011; 2017. Issue: 1.","DOI":"10.1609\/icwsm.v11i1.14891"},{"key":"10577_CR12","unstructured":"Johansson F, Shalit U, Sontag D. Learning representations for counterfactual inference. In: International conference on machine learning; 2016. p. 3020\u20139."},{"key":"10577_CR13","doi-asserted-by":"crossref","unstructured":"Kiciman E, Counts S, Gasser M. Using longitudinal social media analysis to understand the effects of early college alcohol use. In: Twelfth International AAAI Conference on Web and Social Media; 2018.","DOI":"10.1609\/icwsm.v12i1.15012"},{"key":"10577_CR14","doi-asserted-by":"crossref","unstructured":"Mozer R, Miratrix L, Kaufman AR, Anastasopoulos LJ. Matching with Text Data: An Experimental Evaluation of Methods for Matching Documents and of Measuring Match Quality. Polit Anal. 2020;28(4):445\u201368. https:\/\/www.jstor.org\/stable\/27116032.","DOI":"10.1017\/pan.2020.1"},{"key":"10577_CR15","doi-asserted-by":"crossref","unstructured":"Olteanu A, Varol O, Kiciman E. Distilling the Outcomes of Personal Experiences: A Propensity-scored Analysis of Social Media. In: Lee CP, Poltrock SE, Barkhuus L, Borges M, Kellogg WA, editors. Proceedings of the 2017 ACM Conference on Computer Supported Cooperative Work and Social Computing, CSCW 2017, Portland, OR, USA, February 25 - March 1, 2017; 2017. p. 370\u201386.","DOI":"10.1145\/2998181.2998353"},{"key":"10577_CR16","unstructured":"Sridhar D, Springer A, Hollis V, Whittaker S, Getoor L. Estimating causal effects of exercise from mood logging data. In: IJCAI\/ICML Workshop on CausalML; 2018."},{"key":"10577_CR17","doi-asserted-by":"crossref","unstructured":"Wang Z, Culotta A. When Do Words Matter? Understanding the Impact of Lexical Choice on Audience Perception Using Individual Treatment Effect Estimation. In: The Thirty-Third AAAI Conference on Artificial Intelligence, AAAI 2019, The Thirty-First Innovative Applications of Artificial Intelligence Conference, IAAI 2019, The Ninth AAAI Symposium on Educational Advances in Artificial Intelligence, EAAI 2019, Honolulu, Hawaii, USA, January 27 - February 1, 2019; 2019. p. 7233\u201340.","DOI":"10.1609\/aaai.v33i01.33017233"},{"key":"10577_CR18","doi-asserted-by":"crossref","unstructured":"Falavarjani SM, Hosseini H, Noorian Z, Bagheri E. Estimating the effect of exercising on users\u2019 online behavior. In: Proceedings of the International AAAI Conference on Web and Social Media. vol.\u00a011; 2017. Issue: 1.","DOI":"10.1609\/icwsm.v11i1.14975"},{"issue":"4","key":"10577_CR19","doi-asserted-by":"publisher","first-page":"887","DOI":"10.1111\/ajps.12526","volume":"64","author":"ME Roberts","year":"2020","unstructured":"Roberts ME, Stewart BM, Nielsen RA. Adjusting for confounding with text matching. Am J Polit Sci. 2020;64(4):887\u2013903.","journal-title":"Am J Polit Sci"},{"issue":"4","key":"10577_CR20","doi-asserted-by":"publisher","first-page":"1064","DOI":"10.1111\/ajps.12103","volume":"58","author":"ME Roberts","year":"2014","unstructured":"Roberts ME, Stewart BM, Tingley D, Lucas C, Leder-Luis J, Gadarian SK, et al. Structural models for open-ended survey responses. Am J Polit Sci. 2014;58(4):1064\u201382.","journal-title":"Am J Polit Sci"},{"key":"10577_CR21","doi-asserted-by":"crossref","unstructured":"Pennington J, Socher R, Manning C. GloVe: Global Vectors for Word Representation. In: Moschitti A, Pang B, Daelemans W, editors. Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP). Doha, Qatar: Association for Computational Linguistics; 2014. p. 1532\u201343. Available from: https:\/\/aclanthology.org\/D14-1162\/.","DOI":"10.3115\/v1\/D14-1162"},{"key":"10577_CR22","doi-asserted-by":"crossref","unstructured":"Wu Y, Kuang K, Zhang Y, Liu X, Sun C, Xiao J, et\u00a0al. De-biased court\u2019s view generation with causality. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP); 2020. p. 763\u201380.","DOI":"10.18653\/v1\/2020.emnlp-main.56"},{"key":"10577_CR23","doi-asserted-by":"crossref","unstructured":"Pryzant R, Card D, Jurafsky D, Veitch V, Sridhar D. Causal Effects of Linguistic Properties. In: Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies; 2021. p. 4095\u2013109.","DOI":"10.18653\/v1\/2021.naacl-main.323"},{"key":"10577_CR24","unstructured":"Veitch V, Sridhar D, Blei D. Adapting text embeddings for causal inference. In: Conference on Uncertainty in Artificial Intelligence; 2020. p. 919\u201328."},{"key":"10577_CR25","doi-asserted-by":"crossref","unstructured":"Weld G, West P, Glenski M, Arbour D, Rossi RA, Althoff T. Adjusting for Confounders with Text: Challenges and an Empirical Evaluation Framework for Causal Inference. Proc Int AAAI Conf Web Soc Media. 2022;16:1109\u201320. https:\/\/ojs.aaai.org\/index.php\/ICWSM\/article\/view\/19362.","DOI":"10.1609\/icwsm.v16i1.19362"},{"key":"10577_CR26","doi-asserted-by":"publisher","first-page":"150010","DOI":"10.1109\/ACCESS.2025.3598276","volume":"13","author":"H Sharma","year":"2025","unstructured":"Sharma H, Kaur S. Causal representation learning for predicting autoimmune disease progression from longitudinal multimodal clinical data. IEEE Access. 2025;13:150010\u201327.","journal-title":"IEEE Access."},{"key":"10577_CR27","doi-asserted-by":"publisher","first-page":"0467","DOI":"10.34133\/research.0467","volume":"7","author":"L Jiao","year":"2024","unstructured":"Jiao L, Wang Y, Liu X, Li L, Liu F, Ma W, et al. Causal inference meets deep learning: A comprehensive survey. Research. 2024;7:0467.","journal-title":"Research"},{"key":"10577_CR28","unstructured":"Parikh H, Varjao C, Xu L, Tchetgen ET. Validating Causal Inference Methods. In: Chaudhuri K, Jegelka S, Song L, Szepesvari C, Niu G, Sabato S, editors, Proceedings of the 39th International Conference on Machine Learning. vol. 162 of Proceedings of Machine Learning Research. PMLR; 2022. p. 17346\u201358. https:\/\/proceedings.mlr.press\/v162\/parikh22a.html."},{"issue":"5","key":"10577_CR29","doi-asserted-by":"publisher","first-page":"688","DOI":"10.1037\/h0037350","volume":"66","author":"DB Rubin","year":"1974","unstructured":"Rubin DB. Estimating causal effects of treatments in randomized and nonrandomized studies. J Educ Psychol. 1974;66(5):688.","journal-title":"J Educ Psychol"},{"issue":"396","key":"10577_CR30","doi-asserted-by":"publisher","first-page":"945","DOI":"10.1080\/01621459.1986.10478354","volume":"81","author":"PW Holland","year":"1986","unstructured":"Holland PW. Statistics and causal inference. J Am Stat Assoc. 1986;81(396):945\u201360.","journal-title":"J Am Stat Assoc"},{"issue":"9\u201312","key":"10577_CR31","doi-asserted-by":"publisher","first-page":"1393","DOI":"10.1016\/0270-0255(86)90088-6","volume":"7","author":"J Robins","year":"1986","unstructured":"Robins J. A new approach to causal inference in mortality studies with a sustained exposure period - application to control of the healthy worker survivor effect. Math Model. 1986;7(9\u201312):1393\u2013512.","journal-title":"Math Model"},{"issue":"1","key":"10577_CR32","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1093\/biomet\/70.1.41","volume":"70","author":"PR Rosenbaum","year":"1983","unstructured":"Rosenbaum PR, Rubin DB. The central role of the propensity score in observational studies for causal effects. Biometrika. 1983;70(1):41\u201355.","journal-title":"Biometrika"},{"issue":"5","key":"10577_CR33","first-page":"335","volume":"38","author":"S Narduzzi","year":"2014","unstructured":"Narduzzi S, Golini MN, Porta D, Stafoggia M, Forastiere F. Inverse probability weighting (IPW) for evaluating and \u201ccorrecting\u2019\u2019 selection bias. Epidemiologia & Prevenzione. 2014;38(5):335\u201341.","journal-title":"Epidemiologia & Prevenzione."},{"issue":"4","key":"10577_CR34","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1001\/jamanetworkopen.2023.7597","volume":"6","author":"M Lu","year":"2023","unstructured":"Lu M, Zhang Y, Zhang J, Huang S, Huang F, Wang T, et al. Comparative effectiveness of digital cognitive behavioral therapy vs medication therapy among patients with insomnia. JAMA Netw Open. 2023;6(4):1\u201316.","journal-title":"JAMA Netw Open"},{"key":"10577_CR35","doi-asserted-by":"publisher","first-page":"529","DOI":"10.1162\/tacl_a_00078","volume":"5","author":"RJ Gallagher","year":"2017","unstructured":"Gallagher RJ, Reing K, Kale D, Ver Steeg G. Anchored correlation explanation: Topic modeling with minimal domain knowledge. Trans Assoc Comput Linguist. 2017;5:529\u201342.","journal-title":"Trans Assoc Comput Linguist"},{"key":"10577_CR36","unstructured":"Pennebaker JW, Booth RJ, Francis ME. Linguistic Inquiry and Word Count: LIWC2007; 2007."},{"key":"10577_CR37","unstructured":"Kenton JDMWC, Toutanova LK. BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. In: Proceedings of NAACL-HLT; 2019. p. 4171\u201386."},{"key":"10577_CR38","unstructured":"Loshchilov I, Hutter F. Decoupled Weight Decay Regularization. In: International Conference on Learning Representations; 2018."},{"key":"10577_CR39","doi-asserted-by":"crossref","unstructured":"Wolf T, Debut L, Sanh V, Chaumond J, Delangue C, Moi A, et\u00a0al. Transformers: State-of-the-Art Natural Language Processing. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing: System Demonstrations. Online: Association for Computational Linguistics; 2020. p. 38\u201345. Available from: https:\/\/www.aclweb.org\/anthology\/2020.emnlp-demos.6.","DOI":"10.18653\/v1\/2020.emnlp-demos.6"},{"key":"10577_CR40","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1016\/j.ins.2019.09.013","volume":"509","author":"R Campos","year":"2020","unstructured":"Campos R, Mangaravite V, Pasquali A, Jorge A, Nunes C, Jatowt A. YAKE! Keyword extraction from single documents using multiple local features. Inf Sci. 2020;509:257\u201389.","journal-title":"Inf Sci"},{"key":"10577_CR41","first-page":"993","volume":"3","author":"DM Blei","year":"2003","unstructured":"Blei DM, Ng A, Jordan MI. Latent dirichlet allocation. J Mach Learn Res. 2003;3:993\u20131022.","journal-title":"J Mach Learn Res."},{"issue":"429","key":"10577_CR42","doi-asserted-by":"publisher","first-page":"122","DOI":"10.1080\/01621459.1995.10476494","volume":"90","author":"JM Robins","year":"1995","unstructured":"Robins JM, Rotnitzky A. Semiparametric efficiency in multivariate regression models with missing data. J Am Stat Assoc. 1995;90(429):122\u20139.","journal-title":"J Am Stat Assoc"},{"issue":"6324","key":"10577_CR43","doi-asserted-by":"publisher","first-page":"483","DOI":"10.1126\/science.aal4321","volume":"355","author":"S Athey","year":"2017","unstructured":"Athey S. Beyond prediction: Using big data for policy problems. Science. 2017;355(6324):483\u20135.","journal-title":"Science."}],"container-title":["Cognitive Computation"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s12559-026-10577-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s12559-026-10577-8","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s12559-026-10577-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T11:24:22Z","timestamp":1777548262000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s12559-026-10577-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,4,30]]},"references-count":43,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,12]]}},"alternative-id":["10577"],"URL":"https:\/\/doi.org\/10.1007\/s12559-026-10577-8","relation":{},"ISSN":["1866-9956","1866-9964"],"issn-type":[{"value":"1866-9956","type":"print"},{"value":"1866-9964","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,4,30]]},"assertion":[{"value":"12 January 2026","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 April 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 April 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"40"}}