{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T16:49:15Z","timestamp":1755794955732,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":60,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,7,20]],"date-time":"2025-07-20T00:00:00Z","timestamp":1752969600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/https:\/\/doi.org\/10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62372116, 62472415"],"award-info":[{"award-number":["62372116, 62472415"]}],"id":[{"id":"10.13039\/https:\/\/doi.org\/10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/https:\/\/doi.org\/10.13039\/501100012166","name":"National Key Research and Development Program of China","doi-asserted-by":"publisher","award":["2021YFC3340302, 2021YFC3300304"],"award-info":[{"award-number":["2021YFC3340302, 2021YFC3300304"]}],"id":[{"id":"10.13039\/https:\/\/doi.org\/10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,7,20]]},"DOI":"10.1145\/3690624.3709338","type":"proceedings-article","created":{"date-parts":[[2025,4,4]],"date-time":"2025-04-04T18:48:32Z","timestamp":1743792512000},"page":"1197-1208","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Fast Causal Discovery by Approximate Kernel-based Generalized Score Functions with Linear Computational Complexity"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-0084-4903","authenticated-orcid":false,"given":"Yixin","family":"Ren","sequence":"first","affiliation":[{"name":"Fudan University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-1058-1734","authenticated-orcid":false,"given":"Haocheng","family":"Zhang","sequence":"additional","affiliation":[{"name":"Fudan University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5515-5913","authenticated-orcid":false,"given":"Yewei","family":"Xia","sequence":"additional","affiliation":[{"name":"Fudan University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5544-5347","authenticated-orcid":false,"given":"Hao","family":"Zhang","sequence":"additional","affiliation":[{"name":"SIAT, Chinese Academy of Sciences, Shenzhen, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2313-7635","authenticated-orcid":false,"given":"Jihong","family":"Guan","sequence":"additional","affiliation":[{"name":"Tongji University, Shanghai, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1949-2768","authenticated-orcid":false,"given":"Shuigeng","family":"Zhou","sequence":"additional","affiliation":[{"name":"Fudan University, Shanghai, China"}]}],"member":"320","published-online":{"date-parts":[[2025,7,20]]},"reference":[{"key":"e_1_3_2_2_1_1","volume-title":"Advances in Neural Information Processing Systems","volume":"15","author":"Bach Francis","year":"2002","unstructured":"Francis Bach and Michael Jordan. 2002 a. Learning graphical models with Mercer kernels. Advances in Neural Information Processing Systems, Vol. 15 (2002)."},{"key":"e_1_3_2_2_2_1","first-page":"1","article-title":"b. Kernel independent component analysis","volume":"3","author":"Bach Francis R","year":"2002","unstructured":"Francis R Bach and Michael I Jordan. 2002 b. Kernel independent component analysis. Journal of Machine Learning Research, Vol. 3, Jul (2002), 1--48.","journal-title":"Journal of Machine Learning Research"},{"key":"e_1_3_2_2_3_1","volume-title":"DAGMA: Learning DAGs via M-matrices and a Log-Determinant Acyclicity Characterization. In Advances in Neural Information Processing Systems","author":"Bello Kevin","year":"2022","unstructured":"Kevin Bello, Bryon Aragam, and Pradeep Ravikumar. 2022. DAGMA: Learning DAGs via M-matrices and a Log-Determinant Acyclicity Characterization. In Advances in Neural Information Processing Systems, S. Koyejo, S. Mohamed, A. Agarwal, D. Belgrave, K. Cho, and A. Oh (Eds.), Vol. 35. Curran Associates, Inc., 8226--8239. https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2022\/file\/36e2967f87c3362e37cf988781a887ad-Paper-Conference.pdf"},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"publisher","DOI":"10.1214\/14-AOS1260"},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"publisher","DOI":"10.1016\/B978-1-55860-203-8.50010-3"},{"key":"e_1_3_2_2_6_1","first-page":"507","article-title":"Optimal structure identification with greedy search","volume":"3","author":"Chickering David Maxwell","year":"2002","unstructured":"David Maxwell Chickering. 2002. Optimal structure identification with greedy search. Journal of Machine Learning Research, Vol. 3, Nov (2002), 507--554.","journal-title":"Journal of Machine Learning Research"},{"key":"e_1_3_2_2_7_1","volume-title":"Conference on Uncertainty in Artificial Intelligence. Pmlr, 241--249","author":"Chickering Max","year":"2020","unstructured":"Max Chickering. 2020. Statistically efficient greedy equivalence search. In Conference on Uncertainty in Artificial Intelligence. Pmlr, 241--249."},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"publisher","DOI":"10.1007\/11503415_22"},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"publisher","DOI":"10.5555\/1005332.1005335"},{"key":"e_1_3_2_2_10_1","volume-title":"Advances in Neural Information Processing Systems","volume":"21","author":"Fukumizu Kenji","year":"2008","unstructured":"Kenji Fukumizu, Arthur Gretton, Bernhard Sch\u00f6lkopf, and Bharath K Sriperumbudur. 2008. Characteristic kernels on groups and semigroups. Advances in Neural Information Processing Systems, Vol. 21 (2008)."},{"key":"e_1_3_2_2_11_1","volume-title":"Advances in Neural Information Processing Systems","volume":"20","author":"Fukumizu Kenji","year":"2007","unstructured":"Kenji Fukumizu, Arthur Gretton, Xiaohai Sun, and Bernhard Sch\u00f6lkopf. 2007. Kernel measures of conditional dependence. Advances in Neural Information Processing Systems, Vol. 20 (2007)."},{"key":"e_1_3_2_2_12_1","volume-title":"Advances in Neural Information Processing Systems","volume":"31","author":"Gardner Jacob","year":"2018","unstructured":"Jacob Gardner, Geoff Pleiss, Kilian Q Weinberger, David Bindel, and Andrew G Wilson. 2018. Gpytorch: Blackbox matrix-matrix gaussian process inference with gpu acceleration. Advances in Neural Information Processing Systems, Vol. 31 (2018)."},{"volume-title":"Uncertainty in Artificial Intelligence","author":"Geiger Dan","key":"e_1_3_2_2_13_1","unstructured":"Dan Geiger and David Heckerman. 1994. Learning gaussian networks. In Uncertainty in Artificial Intelligence. Elsevier, 235--243."},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1022623210503"},{"key":"e_1_3_2_2_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/3219819.3220104"},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"publisher","DOI":"10.5555\/2567709.2502585"},{"key":"e_1_3_2_2_17_1","first-page":"981","article-title":"Sampling methods for the Nystr\u00f6m method","volume":"13","author":"Kumar Sanjiv","year":"2012","unstructured":"Sanjiv Kumar, Mehryar Mohri, and Ameet Talwalkar. 2012. Sampling methods for the Nystr\u00f6m method. The Journal of Machine Learning Research, Vol. 13, 1 (2012), 981--1006.","journal-title":"The Journal of Machine Learning Research"},{"key":"e_1_3_2_2_18_1","volume-title":"Gradient-based neural dag learning. arXiv preprint arXiv:1906.02226","author":"Lachapelle S\u00e9bastien","year":"2019","unstructured":"S\u00e9bastien Lachapelle, Philippe Brouillard, Tristan Deleu, and Simon Lacoste-Julien. 2019. Gradient-based neural dag learning. arXiv preprint arXiv:1906.02226 (2019)."},{"key":"e_1_3_2_2_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2019.2957109"},{"key":"e_1_3_2_2_20_1","first-page":"17943","article-title":"On the role of sparsity and dag constraints for learning linear dags","volume":"33","author":"Ng Ignavier","year":"2020","unstructured":"Ignavier Ng, AmirEmad Ghassami, and Kun Zhang. 2020. On the role of sparsity and dag constraints for learning linear dags. Advances in Neural Information Processing Systems, Vol. 33 (2020), 17943--17954.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_2_21_1","unstructured":"Ignavier Ng Biwei Huang and Kun Zhang. 2024. Structure learning with continuous optimization: A sober look and beyond. In Causal Learning and Reasoning. PMLR 71--105."},{"key":"e_1_3_2_2_22_1","volume-title":"Theoretical impediments to machine learning with seven sparks from the causal revolution. arXiv preprint arXiv:1801.04016","author":"Pearl Judea","year":"2018","unstructured":"Judea Pearl. 2018. Theoretical impediments to machine learning with seven sparks from the causal revolution. arXiv preprint arXiv:1801.04016 (2018)."},{"key":"e_1_3_2_2_23_1","unstructured":"Judea Pearl and Dana Mackenzie. 2018. The book of why: the new science of cause and effect. Basic books."},{"key":"e_1_3_2_2_24_1","volume-title":"Advances in Neural Information Processing Systems","volume":"20","author":"Rahimi Ali","year":"2007","unstructured":"Ali Rahimi and Benjamin Recht. 2007. Random features for large-scale kernel machines. Advances in Neural Information Processing Systems, Vol. 20 (2007)."},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1007\/s41060-016-0032-z"},{"key":"e_1_3_2_2_26_1","volume-title":"Efficiently Learning Significant Fourier Feature Pairs for Statistical Independence Testing. In The Thirty-eighth Annual Conference on Neural Information Processing Systems.","author":"Ren Yixin","year":"2024","unstructured":"Yixin Ren, Yewei Xia, Hao Zhang, Jihong Guan, and Shuigeng Zhou. 2024a. Efficiently Learning Significant Fourier Feature Pairs for Statistical Independence Testing. In The Thirty-eighth Annual Conference on Neural Information Processing Systems."},{"key":"e_1_3_2_2_27_1","volume-title":"Learning Adaptive Kernels for Statistical Independence Tests. In International Conference on Artificial Intelligence and Statistics. PMLR, 2494--2502","author":"Ren Yixin","year":"2024","unstructured":"Yixin Ren, Yewei Xia, Hao Zhang, Jihong Guan, and Shuigeng Zhou. 2024b. Learning Adaptive Kernels for Statistical Independence Tests. In International Conference on Artificial Intelligence and Statistics. PMLR, 2494--2502."},{"key":"e_1_3_2_2_28_1","volume-title":"International Conference on Machine Learning. PMLR","author":"Rolland Paul","year":"2022","unstructured":"Paul Rolland, Volkan Cevher, Matth\u00e4us Kleindessner, Chris Russell, Dominik Janzing, Bernhard Sch\u00f6lkopf, and Francesco Locatello. 2022. Score matching enables causal discovery of nonlinear additive noise models. In International Conference on Machine Learning. PMLR, 18741--18753."},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2021.3058954"},{"volume-title":"Learning with kernels: support vector machines, regularization, optimization, and beyond","author":"Sch\u00f6lkopf Bernhard","key":"e_1_3_2_2_30_1","unstructured":"Bernhard Sch\u00f6lkopf and Alexander J Smola. 2002. Learning with kernels: support vector machines, regularization, optimization, and beyond. MIT press."},{"key":"e_1_3_2_2_31_1","volume-title":"Estimating the dimension of a model. The Annals of Statistics","author":"Schwarz Gideon","year":"1978","unstructured":"Gideon Schwarz. 1978. Estimating the dimension of a model. The Annals of Statistics (1978), 461--464."},{"key":"e_1_3_2_2_32_1","first-page":"1","article-title":"Memory efficient kernel approximation","volume":"18","author":"Si Si","year":"2017","unstructured":"Si Si, Cho-Jui Hsieh, and Inderjit S Dhillon. 2017. Memory efficient kernel approximation. Journal of Machine Learning Research, Vol. 18, 20 (2017), 1--32.","journal-title":"Journal of Machine Learning Research"},{"key":"e_1_3_2_2_33_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-11433-0_29"},{"volume-title":"prediction, and search","author":"Spirtes Peter","key":"e_1_3_2_2_34_1","unstructured":"Peter Spirtes, Clark Glymour, and Richard Scheines. 2001. Causation, prediction, and search. MIT press."},{"volume-title":"Applied Informatics","author":"Spirtes Peter","key":"e_1_3_2_2_35_1","unstructured":"Peter Spirtes and Kun Zhang. 2016. Causal discovery and inference: concepts and recent methodological advances. In Applied Informatics, Vol. 3. Springer, 1--28."},{"key":"e_1_3_2_2_36_1","doi-asserted-by":"publisher","DOI":"10.5555\/1756006.1859901"},{"key":"e_1_3_2_2_37_1","doi-asserted-by":"publisher","DOI":"10.1515\/jci-2018-0017"},{"key":"e_1_3_2_2_38_1","volume-title":"Nts-notears: Learning nonparametric dbns with prior knowledge. arXiv preprint arXiv:2109.04286","author":"Sun Xiangyu","year":"2021","unstructured":"Xiangyu Sun, Oliver Schulte, Guiliang Liu, and Pascal Poupart. 2021. Nts-notears: Learning nonparametric dbns with prior knowledge. arXiv preprint arXiv:2109.04286 (2021)."},{"key":"e_1_3_2_2_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/956750.956838"},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10994-006-6889-7"},{"key":"e_1_3_2_2_41_1","doi-asserted-by":"publisher","DOI":"10.1145\/3527154"},{"key":"e_1_3_2_2_42_1","first-page":"2574","article-title":"A survey on large-scale machine learning","volume":"34","author":"Wang Meng","year":"2020","unstructured":"Meng Wang, Weijie Fu, Xiangnan He, Shijie Hao, and Xindong Wu. 2020. A survey on large-scale machine learning. IEEE Transactions on Knowledge and Data Engineering, Vol. 34, 6 (2020), 2574--2594.","journal-title":"IEEE Transactions on Knowledge and Data Engineering"},{"key":"e_1_3_2_2_43_1","volume-title":"Optimal Kernel Choice for Score Function-based Causal Discovery. In Forty-first International Conference on Machine Learning.","author":"Wang Wenjie","year":"2024","unstructured":"Wenjie Wang, Biwei Huang, Feng Liu, Xinge You, Tongliang Liu, Kun Zhang, and Mingming Gong. 2024. Optimal Kernel Choice for Score Function-based Causal Discovery. In Forty-first International Conference on Machine Learning."},{"key":"e_1_3_2_2_44_1","first-page":"3895","article-title":"DAGs with No Fears: A closer look at continuous optimization for learning Bayesian networks","volume":"33","author":"Wei Dennis","year":"2020","unstructured":"Dennis Wei, Tian Gao, and Yue Yu. 2020. DAGs with No Fears: A closer look at continuous optimization for learning Bayesian networks. Advances in Neural Information Processing Systems, Vol. 33 (2020), 3895--3906.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_2_45_1","volume-title":"Advances in Neural Information Processing Systems","volume":"8","author":"Williams Christopher","year":"1995","unstructured":"Christopher Williams and Carl Rasmussen. 1995. Gaussian processes for regression. Advances in Neural Information Processing Systems, Vol. 8 (1995)."},{"key":"e_1_3_2_2_46_1","volume-title":"Advances in Neural Information Processing Systems","volume":"13","author":"Williams Christopher","year":"2000","unstructured":"Christopher Williams and Matthias Seeger. 2000. Using the Nystr\u00f6m method to speed up kernel machines. Advances in Neural Information Processing Systems, Vol. 13 (2000)."},{"key":"e_1_3_2_2_47_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICDM58522.2023.00076"},{"key":"e_1_3_2_2_48_1","volume-title":"Advances in Neural Information Processing Systems","volume":"25","author":"Yang Tianbao","year":"2012","unstructured":"Tianbao Yang, Yu-Feng Li, Mehrdad Mahdavi, Rong Jin, and Zhi-Hua Zhou. 2012. Nystr\u00f6m method vs random fourier features: A theoretical and empirical comparison. Advances in Neural Information Processing Systems, Vol. 25 (2012)."},{"key":"e_1_3_2_2_49_1","volume-title":"International Conference on Machine Learning. PMLR, 7154--7163","author":"Yu Yue","year":"2019","unstructured":"Yue Yu, Jie Chen, Tian Gao, and Mo Yu. 2019. DAG-GNN: DAG structure learning with graph neural networks. In International Conference on Machine Learning. PMLR, 7154--7163."},{"key":"e_1_3_2_2_50_1","doi-asserted-by":"publisher","DOI":"10.5555\/2591248.2591250"},{"key":"e_1_3_2_2_51_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2024.3435503"},{"key":"e_1_3_2_2_52_1","volume-title":"Kernel-based conditional independence test and application in causal discovery. arXiv preprint arXiv:1202.3775","author":"Zhang Kun","year":"2012","unstructured":"Kun Zhang, Jonas Peters, Dominik Janzing, and Bernhard Sch\u00f6lkopf. 2012. Kernel-based conditional independence test and application in causal discovery. arXiv preprint arXiv:1202.3775 (2012)."},{"key":"e_1_3_2_2_53_1","doi-asserted-by":"publisher","DOI":"10.1093\/nsr\/nwx137"},{"key":"e_1_3_2_2_54_1","volume-title":"Causal representation learning from multiple distributions: A general setting. arXiv preprint arXiv:2402.05052","author":"Zhang Kun","year":"2024","unstructured":"Kun Zhang, Shaoan Xie, Ignavier Ng, and Yujia Zheng. 2024b. Causal representation learning from multiple distributions: A general setting. arXiv preprint arXiv:2402.05052 (2024)."},{"key":"e_1_3_2_2_55_1","doi-asserted-by":"publisher","DOI":"10.1007\/s11222-016-9721-7"},{"key":"e_1_3_2_2_56_1","first-page":"18390","article-title":"Truncated matrix power iteration for differentiable dag learning","volume":"35","author":"Zhang Zhen","year":"2022","unstructured":"Zhen Zhang, Ignavier Ng, Dong Gong, Yuhang Liu, Ehsan Abbasnejad, Mingming Gong, Kun Zhang, and Javen Qinfeng Shi. 2022. Truncated matrix power iteration for differentiable dag learning. Advances in Neural Information Processing Systems, Vol. 35 (2022), 18390--18402.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_2_57_1","volume-title":"Advances in Neural Information Processing Systems","volume":"31","author":"Zheng Xun","year":"2018","unstructured":"Xun Zheng, Bryon Aragam, Pradeep K Ravikumar, and Eric P Xing. 2018a. Dags with no tears: Continuous optimization for structure learning. Advances in Neural Information Processing Systems, Vol. 31 (2018)."},{"key":"e_1_3_2_2_58_1","volume-title":"Garnett (Eds.)","volume":"31","author":"Zheng Xun","year":"2018","unstructured":"Xun Zheng, Bryon Aragam, Pradeep K Ravikumar, and Eric P Xing. 2018b. DAGs with NO TEARS: Continuous Optimization for Structure Learning. In Advances in Neural Information Processing Systems, S. Bengio, H. Wallach, H. Larochelle, K. Grauman, N. Cesa-Bianchi, and R. Garnett (Eds.), Vol. 31. Curran Associates, Inc. https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2018\/file\/e347c51419ffb23ca3fd5050202f9c3d-Paper.pdf"},{"key":"e_1_3_2_2_59_1","volume-title":"International Conference on Artificial Intelligence and Statistics. Pmlr, 3414--3425","author":"Zheng Xun","year":"2020","unstructured":"Xun Zheng, Chen Dan, Bryon Aragam, Pradeep Ravikumar, and Eric Xing. 2020. Learning sparse nonparametric dags. In International Conference on Artificial Intelligence and Statistics. Pmlr, 3414--3425."},{"key":"e_1_3_2_2_60_1","first-page":"1","article-title":"Causal-learn: Causal discovery in python","volume":"25","author":"Zheng Yujia","year":"2024","unstructured":"Yujia Zheng, Biwei Huang, Wei Chen, Joseph Ramsey, Mingming Gong, Ruichu Cai, Shohei Shimizu, Peter Spirtes, and Kun Zhang. 2024. Causal-learn: Causal discovery in python. Journal of Machine Learning Research, Vol. 25, 60 (2024), 1--8.","journal-title":"Journal of Machine Learning Research"}],"event":{"name":"KDD '25: The 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"],"location":"Toronto ON Canada","acronym":"KDD '25"},"container-title":["Proceedings of the 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining V.1"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3690624.3709338","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3690624.3709338","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,16]],"date-time":"2025-08-16T15:43:22Z","timestamp":1755359002000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3690624.3709338"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,20]]},"references-count":60,"alternative-id":["10.1145\/3690624.3709338","10.1145\/3690624"],"URL":"https:\/\/doi.org\/10.1145\/3690624.3709338","relation":{},"subject":[],"published":{"date-parts":[[2025,7,20]]},"assertion":[{"value":"2025-07-20","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}