{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,8]],"date-time":"2026-02-08T07:51:58Z","timestamp":1770537118257,"version":"3.49.0"},"reference-count":96,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,12,26]],"date-time":"2025-12-26T00:00:00Z","timestamp":1766707200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,12,26]],"date-time":"2025-12-26T00:00:00Z","timestamp":1766707200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["The VLDB Journal"],"published-print":{"date-parts":[[2026,1]]},"DOI":"10.1007\/s00778-025-00956-2","type":"journal-article","created":{"date-parts":[[2025,12,26]],"date-time":"2025-12-26T14:08:30Z","timestamp":1766758110000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["TablePuppet: Towards a Generic Framework for Learning over Relational Tables"],"prefix":"10.1007","volume":"35","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-2013-4241","authenticated-orcid":false,"given":"Lijie","family":"Xu","sequence":"first","affiliation":[]},{"given":"Chulin","family":"Xie","sequence":"additional","affiliation":[]},{"given":"Yiran","family":"Guo","sequence":"additional","affiliation":[]},{"given":"Haiyang","family":"Lu","sequence":"additional","affiliation":[]},{"given":"Gustavo","family":"Alonso","sequence":"additional","affiliation":[]},{"given":"Bo","family":"Li","sequence":"additional","affiliation":[]},{"given":"Guoliang","family":"Li","sequence":"additional","affiliation":[]},{"given":"Wei","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Wentao","family":"Wu","sequence":"additional","affiliation":[]},{"given":"Ce","family":"Zhang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,12,26]]},"reference":[{"key":"956_CR1","unstructured":"MovieLens 1M dataset. https:\/\/grouplens.org\/datasets\/movielens\/1m\/ (2003)"},{"key":"956_CR2","unstructured":"General Data Protection Regulation (GDPR). https:\/\/gdpr-info.eu\/ (2016)"},{"key":"956_CR3","unstructured":"MIMIC-III Clinical Database. https:\/\/physionet.org\/content\/mimiciii\/1.4\/ (2016)"},{"key":"956_CR4","unstructured":"MIMIC-III Benchmarks. https:\/\/github.com\/YerevaNN\/mimic3-benchmarks (2023)"},{"key":"956_CR5","unstructured":"Yelp Open Dataset: An all-purpose dataset for learning. https:\/\/www.yelp.com\/dataset (2023)"},{"key":"956_CR6","unstructured":"DB-Engines. Ranking scores per category in percent. https:\/\/db-engines.com\/en\/ranking_categories?ref=timescale-blog (2024)"},{"key":"956_CR7","unstructured":"Flower: A Friendly Federated AI Framework. https:\/\/github.com\/adap\/flower (2025)"},{"key":"956_CR8","doi-asserted-by":"crossref","unstructured":"Abadi, M., Chu, A., Goodfellow, I., McMahan, H.B., Mironov, I., Talwar, K., Zhang, L.: Deep learning with differential privacy. In: Proceedings of the 2016 ACM SIGSAC conference on computer and communications security, pp. 308\u2013318 (2016)","DOI":"10.1145\/2976749.2978318"},{"key":"956_CR9","doi-asserted-by":"crossref","unstructured":"Arnold, J., Glavic, B., Raicu, I.: A high-performance distributed relational database system for scalable OLAP processing. In: 2019 IEEE International Parallel and Distributed Processing Symposium, IPDPS 2019, Rio de Janeiro, Brazil, May 20-24, 2019, pp. 738\u2013748. IEEE (2019)","DOI":"10.1109\/IPDPS.2019.00083"},{"key":"956_CR10","doi-asserted-by":"crossref","unstructured":"Ben-Or, M., Goldwasser, S., Wigderson, A.: Completeness theorems for non-cryptographic fault-tolerant distributed computation. In: Proceedings of the twentieth annual ACM symposium on Theory of computing, pp. 1\u201310 (1988)","DOI":"10.1145\/62212.62213"},{"key":"956_CR11","doi-asserted-by":"crossref","unstructured":"Bonawitz, K., Ivanov, V., Kreuter, B., Marcedone, A., McMahan, H.B., Patel, S., Ramage, D., Segal, A., Seth, K.: Practical secure aggregation for privacy-preserving machine learning. In: proceedings of the 2017 ACM SIGSAC Conference on Computer and Communications Security, pp. 1175\u20131191 (2017)","DOI":"10.1145\/3133956.3133982"},{"issue":"1","key":"956_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1561\/2200000016","volume":"3","author":"SP Boyd","year":"2011","unstructured":"Boyd, S.P., Parikh, N., Chu, E., Peleato, B., Eckstein, J.: Distributed optimization and statistical learning via the alternating direction method of multipliers. Found. Trends Mach. Learn. 3(1), 1\u2013122 (2011)","journal-title":"Found. Trends Mach. Learn."},{"issue":"13","key":"956_CR13","doi-asserted-by":"publisher","first-page":"1484","DOI":"10.14778\/2733004.2733020","volume":"7","author":"N Bruno","year":"2014","unstructured":"Bruno, N., Kwon, Y., Wu, M.: Advanced join strategies for large-scale distributed computation. Proc. VLDB Endow. 7(13), 1484\u20131495 (2014)","journal-title":"Proc. VLDB Endow."},{"issue":"12","key":"956_CR14","doi-asserted-by":"publisher","first-page":"2791","DOI":"10.14778\/3476311.3476346","volume":"14","author":"S Castelo","year":"2021","unstructured":"Castelo, S., Rampin, R., Santos, A.S.R., Bessa, A., Chirigati, F., Freire, J.: Auctus: A dataset search engine for data discovery and augmentation. Proc. VLDB Endow. 14(12), 2791\u20132794 (2021)","journal-title":"Proc. VLDB Endow."},{"key":"956_CR15","doi-asserted-by":"crossref","unstructured":"Chaudhuri, S., Motwani, R., Narasayya, V.R.: On random sampling over joins. In: SIGMOD 1999, Proceedings ACM SIGMOD International Conference on Management of Data, June 1-3, 1999, Philadelphia, Pennsylvania, USA, pp. 263\u2013274. ACM Press (1999)","DOI":"10.1145\/304182.304206"},{"issue":"11","key":"956_CR16","doi-asserted-by":"publisher","first-page":"1214","DOI":"10.14778\/3137628.3137633","volume":"10","author":"L Chen","year":"2017","unstructured":"Chen, L., Kumar, A., Naughton, J.F., Patel, J.M.: Towards linear algebra over normalized data. Proc. VLDB Endow. 10(11), 1214\u20131225 (2017)","journal-title":"Proc. VLDB Endow."},{"key":"956_CR17","unstructured":"Chen, T., Jin, X., Sun, Y., Yin, W.: Vafl: A method of vertical asynchronous federated learning. arXiv preprint arXiv:2007.06081 (2020)"},{"issue":"4","key":"956_CR18","doi-asserted-by":"publisher","first-page":"83","DOI":"10.1109\/MIS.2020.2988604","volume":"35","author":"Y Chen","year":"2020","unstructured":"Chen, Y., Qin, X., Wang, J., Yu, C., Gao, W.: Fedhealth: A federated transfer learning framework for wearable healthcare. IEEE Intell. Syst. 35(4), 83\u201393 (2020)","journal-title":"IEEE Intell. Syst."},{"issue":"6","key":"956_CR19","doi-asserted-by":"publisher","first-page":"87","DOI":"10.1109\/MIS.2021.3082561","volume":"36","author":"K Cheng","year":"2021","unstructured":"Cheng, K., Fan, T., Jin, Y., Liu, Y., Chen, T., Papadopoulos, D., Yang, Q.: Secureboost: A lossless federated learning framework. IEEE Intell. Syst. 36(6), 87\u201398 (2021)","journal-title":"IEEE Intell. Syst."},{"issue":"3","key":"956_CR20","doi-asserted-by":"publisher","first-page":"118","DOI":"10.1145\/3654921","volume":"2","author":"B Dai","year":"2024","unstructured":"Dai, B., Hu, X., Yi, K.: Reservoir sampling over joins. Proc. ACM Manag. Data 2(3), 118 (2024)","journal-title":"Proc. ACM Manag. Data"},{"key":"956_CR21","doi-asserted-by":"crossref","unstructured":"Devlin, J., Chang, M., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding. In: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, NAACL-HLT 2019, pp. 4171\u20134186 (2019)","DOI":"10.18653\/v1\/N19-1423"},{"key":"956_CR22","unstructured":"Dinh, C.T., Tran, N.H., Nguyen, T.D.: Personalized federated learning with moreau envelopes. In: Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020, December 6-12, 2020, virtual (2020)"},{"key":"956_CR23","volume-title":"The algorithmic foundations of differential privacy","author":"C Dwork","year":"2014","unstructured":"Dwork, C., Roth, A., et al.: The algorithmic foundations of differential privacy, vol. 9. Now Publishers, Inc (2014)"},{"key":"956_CR24","unstructured":"Esmailoghli, M., Quian\u00e9-Ruiz, J., Abedjan, Z.: COCOA: correlation coefficient-aware data augmentation. In: Proceedings of the 24th International Conference on Extending Database Technology, EDBT 2021, Nicosia, Cyprus, March 23 - 26, 2021, pp. 331\u2013336. OpenProceedings.org (2021)"},{"key":"956_CR25","unstructured":"Feng, S., Yu, H.: Multi-participant multi-class vertical federated learning. arXiv preprint arXiv:2001.11154 (2020)"},{"key":"956_CR26","unstructured":"Fernandez, R.C., Min, J., Nava, D., Madden, S.: Lazo: A cardinality-based method for coupled estimation of jaccard similarity and containment. In: 35th IEEE International Conference on Data Engineering, ICDE 2019, Macao, China, April 8-11, 2019, pp. 1190\u20131201. IEEE (2019)"},{"issue":"10","key":"956_CR27","doi-asserted-by":"publisher","first-page":"2111","DOI":"10.14778\/3547305.3547316","volume":"15","author":"F Fu","year":"2022","unstructured":"Fu, F., Miao, X., Jiang, J., Xue, H., Cui, B.: Towards communication-efficient vertical federated learning training via cache-enabled local update. Proc. VLDB Endow. 15(10), 2111\u20132120 (2022)","journal-title":"Proc. VLDB Endow."},{"key":"956_CR28","doi-asserted-by":"crossref","unstructured":"Fu, F., Shao, Y., Yu, L., Jiang, J., Xue, H., Tao, Y., Cui, B.: Vf$$ ^{\\text{2}}$$boost: Very fast vertical federated gradient boosting for cross-enterprise learning. In: SIGMOD \u201921: International Conference on Management of Data, 2021, pp. 563\u2013576. ACM (2021)","DOI":"10.1145\/3448016.3457241"},{"key":"956_CR29","doi-asserted-by":"crossref","unstructured":"Galhotra, S., Gong, Y., Fernandez, R.C.: Metam: Goal-oriented data discovery. In: 39th IEEE International Conference on Data Engineering, ICDE 2023, Anaheim, CA, USA, April 3-7, 2023, pp. 2780\u20132793. IEEE (2023)","DOI":"10.1109\/ICDE55515.2023.00213"},{"key":"956_CR30","doi-asserted-by":"crossref","unstructured":"Getoor, L., Taskar, B.: Introduction to Statistical Relational Learning (Adaptive Computation and Machine Learning). The MIT Press (2007)","DOI":"10.7551\/mitpress\/7432.001.0001"},{"key":"956_CR31","first-page":"27131","volume":"34","author":"B Ghazi","year":"2021","unstructured":"Ghazi, B., Golowich, N., Kumar, R., Manurangsi, P., Zhang, C.: Deep learning with label differential privacy. Adv. Neural. Inf. Process. Syst. 34, 27131\u201327145 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"956_CR32","unstructured":"Gilad-Bachrach, R., Dowlin, N., Laine, K., Lauter, K., Naehrig, M., Wernsing, J.: Cryptonets: Applying neural networks to encrypted data with high throughput and accuracy. In: International Conference on Machine Learning, pp. 201\u2013210. PMLR (2016)"},{"key":"956_CR33","doi-asserted-by":"crossref","unstructured":"Gong, Y., Zhu, Z., Galhotra, S., Fernandez, R.C.: Ver: View discovery in the wild. In: 39th IEEE International Conference on Data Engineering, ICDE 2023, Anaheim, CA, USA, April 3-7, 2023, pp. 503\u2013516. IEEE (2023)","DOI":"10.1109\/ICDE55515.2023.00045"},{"key":"956_CR34","unstructured":"Grinsztajn, L., Oyallon, E., Varoquaux, G.: Why do tree-based models still outperform deep learning on typical tabular data? In: Advances in Neural Information Processing Systems 35: Annual Conference on Neural Information Processing Systems 2022, NeurIPS 2022, New Orleans, LA, USA, November 28 - December 9, 2022 (2022)"},{"key":"956_CR35","doi-asserted-by":"crossref","unstructured":"Gu, B., Dang, Z., Li, X., Huang, H.: Federated doubly stochastic kernel learning for vertically partitioned data. In: Proceedings of the 26th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining, pp. 2483\u20132493 (2020)","DOI":"10.1145\/3394486.3403298"},{"issue":"11","key":"956_CR36","doi-asserted-by":"publisher","first-page":"6103","DOI":"10.1109\/TNNLS.2021.3072238","volume":"33","author":"B Gu","year":"2022","unstructured":"Gu, B., Xu, A., Huo, Z., Deng, C., Huang, H.: Privacy-preserving asynchronous vertical federated learning algorithms for multiparty collaborative learning. IEEE Trans. Neural Networks Learn. Syst. 33(11), 6103\u20136115 (2022)","journal-title":"IEEE Trans. Neural Networks Learn. Syst."},{"key":"956_CR37","doi-asserted-by":"publisher","unstructured":"Han, Y., Du, P., Yang, K.: Fedgbf: An efficient vertical federated learning framework via gradient boosting and bagging. CoRR abs\/2204.00976 (2022). https:\/\/doi.org\/10.48550\/arXiv.2204.00976","DOI":"10.48550\/arXiv.2204.00976"},{"key":"956_CR38","unstructured":"Hardy, S., Henecka, W., Ivey-Law, H., Nock, R., Patrini, G., Smith, G., Thorne, B.: Private federated learning on vertically partitioned data via entity resolution and additively homomorphic encryption. arXiv preprint arXiv:1711.10677 (2017)"},{"issue":"1","key":"956_CR39","doi-asserted-by":"publisher","first-page":"96","DOI":"10.1038\/s41597-019-0103-9","volume":"6","author":"H Harutyunyan","year":"2019","unstructured":"Harutyunyan, H., Khachatrian, H., Kale, D.C., Ver Steeg, G., Galstyan, A.: Multitask learning and benchmarking with clinical time series data. Scientific Data 6(1), 96 (2019)","journal-title":"Scientific Data"},{"issue":"1","key":"956_CR40","doi-asserted-by":"publisher","first-page":"337","DOI":"10.1137\/140990309","volume":"26","author":"M Hong","year":"2016","unstructured":"Hong, M., Luo, Z.Q., Razaviyayn, M.: Convergence analysis of alternating direction method of multipliers for a family of nonconvex problems. SIAM J. Optim. 26(1), 337\u2013364 (2016)","journal-title":"SIAM J. Optim."},{"key":"956_CR41","unstructured":"Hu, Y., Liu, P., Kong, L., Niu, D.: Learning privately over distributed features: An admm sharing approach. arXiv preprint arXiv:1907.07735 (2019)"},{"key":"956_CR42","doi-asserted-by":"crossref","unstructured":"Hu, Y., Niu, D., Yang, J., Zhou, S.: Fdml: A collaborative machine learning framework for distributed features. In: Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining, pp. 2232\u20132240 (2019)","DOI":"10.1145\/3292500.3330765"},{"key":"956_CR43","unstructured":"Jin, X., Chen, P.Y., Hsu, C.Y., Yu, C.M., Chen, T.: Catastrophic data leakage in vertical federated learning. Advances in Neural Information Processing Systems 34 (2021)"},{"key":"956_CR44","unstructured":"Karimireddy, S.P., Kale, S., Mohri, M., Reddi, S.J., Stich, S.U., Suresh, A.T.: SCAFFOLD: stochastic controlled averaging for federated learning. In: Proceedings of the 37th International Conference on Machine Learning, ICML 2020, 13-18 July 2020, Virtual Event, Proceedings of Machine Learning Research, vol. 119, pp. 5132\u20135143. PMLR (2020)"},{"key":"956_CR45","doi-asserted-by":"publisher","unstructured":"Khan, A., ten Thij, M., Wilbik, A.: Vertical federated learning: A structured literature review. CoRR abs\/2212.00622 (2022). https:\/\/doi.org\/10.48550\/arXiv.2212.00622","DOI":"10.48550\/arXiv.2212.00622"},{"issue":"3","key":"956_CR46","doi-asserted-by":"publisher","first-page":"443","DOI":"10.1145\/319732.319745","volume":"7","author":"W Kim","year":"1982","unstructured":"Kim, W.: On optimizing an sql-like nested query. ACM Trans. Database Syst. 7(3), 443\u2013469 (1982)","journal-title":"ACM Trans. Database Syst."},{"key":"956_CR47","unstructured":"Kone\u010dn\u00fd, J., McMahan, H.B., Ramage, D., Richt\u00e1rik, P.: Federated optimization: Distributed machine learning for on-device intelligence. CoRR abs\/1610.02527 (2016). http:\/\/arxiv.org\/abs\/1610.02527"},{"key":"956_CR48","unstructured":"Kone\u010dn\u00fd, J., McMahan, H.B., Yu, F.X., Richt\u00e1rik, P., Suresh, A.T., Bacon, D.: Federated learning: Strategies for improving communication efficiency. CoRR abs\/1610.05492 (2016). http:\/\/arxiv.org\/abs\/1610.05492"},{"issue":"4","key":"956_CR49","doi-asserted-by":"publisher","first-page":"422","DOI":"10.1145\/371578.371598","volume":"32","author":"D Kossmann","year":"2000","unstructured":"Kossmann, D.: The state of the art in distributed query processing. ACM Comput. Surv. 32(4), 422\u2013469 (2000)","journal-title":"ACM Comput. Surv."},{"key":"956_CR50","doi-asserted-by":"crossref","unstructured":"Kumar, A., Naughton, J.F., Patel, J.M.: Learning generalized linear models over normalized data. In: Proceedings of the 2015 ACM SIGMOD International Conference on Management of Data, pp. 1969\u20131984. ACM (2015)","DOI":"10.1145\/2723372.2723713"},{"key":"956_CR51","doi-asserted-by":"crossref","unstructured":"Kumar, A., Naughton, J.F., Patel, J.M., Zhu, X.: To join or not to join?: Thinking twice about joins before feature selection. In: Proceedings of the 2016 International Conference on Management of Data, SIGMOD Conference 2016, San Francisco, CA, USA, June 26 - July 01, 2016, pp. 19\u201334. ACM (2016)","DOI":"10.1145\/2882903.2882952"},{"key":"956_CR52","doi-asserted-by":"crossref","unstructured":"Li, Q., Diao, Y., Chen, Q., He, B.: Federated learning on non-iid data silos: An experimental study. In: 38th IEEE International Conference on Data Engineering, ICDE 2022, pp. 965\u2013978. IEEE (2022)","DOI":"10.1109\/ICDE53745.2022.00077"},{"issue":"4","key":"956_CR53","doi-asserted-by":"publisher","first-page":"828","DOI":"10.14778\/3503585.3503592","volume":"15","author":"J Liu","year":"2021","unstructured":"Liu, J., Lou, J., Xiong, L., Liu, J., Meng, X.: Projected federated averaging with heterogeneous differential privacy. Proc. VLDB Endow. 15(4), 828\u2013840 (2021)","journal-title":"Proc. VLDB Endow."},{"issue":"4","key":"956_CR54","doi-asserted-by":"publisher","first-page":"70","DOI":"10.1109\/MIS.2020.2988525","volume":"35","author":"Y Liu","year":"2020","unstructured":"Liu, Y., Kang, Y., Xing, C., Chen, T., Yang, Q.: A secure federated transfer learning framework. IEEE Intell. Syst. 35(4), 70\u201382 (2020)","journal-title":"IEEE Intell. Syst."},{"key":"956_CR55","unstructured":"Liu, Y., Kang, Y., Zhang, X., Li, L., Cheng, Y., Chen, T., Hong, M., Yang, Q.: A communication efficient collaborative learning framework for distributed features. arXiv preprint arXiv:1912.11187 (2019)"},{"key":"956_CR56","doi-asserted-by":"publisher","unstructured":"Liu, Y., Kang, Y., Zou, T., Pu, Y., He, Y., Ye, X., Ouyang, Y., Zhang, Y., Yang, Q.: Vertical federated learning: Concepts, advances and challenges. CoRR abs\/2211.12814 (2023). https:\/\/doi.org\/10.48550\/arXiv.2211.12814","DOI":"10.48550\/arXiv.2211.12814"},{"key":"956_CR57","doi-asserted-by":"crossref","unstructured":"Lu, L., Ding, N.: Multi-party private set intersection in vertical federated learning. In: 19th IEEE International Conference on Trust, Security and Privacy in Computing and Communications, TrustCom 2020, pp. 707\u2013714. IEEE (2020)","DOI":"10.1109\/TrustCom50675.2020.00098"},{"key":"956_CR58","doi-asserted-by":"crossref","unstructured":"Ma, J., Zhang, Q., Lou, J., Ho, J.C., Xiong, L., Jiang, X.: Privacy-preserving tensor factorization for collaborative health data analysis. In: Proceedings of the 28th ACM International Conference on Information and Knowledge Management, CIKM 2019, Beijing, China, November 3-7, 2019, pp. 1291\u20131300. ACM (2019)","DOI":"10.1145\/3357384.3357878"},{"key":"956_CR59","first-page":"6934","volume":"34","author":"M Malek Esmaeili","year":"2021","unstructured":"Malek Esmaeili, M., Mironov, I., Prasad, K., Shilov, I., Tramer, F.: Antipodes of label differential privacy: Pate and alibi. Adv. Neural. Inf. Process. Syst. 34, 6934\u20136945 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"key":"956_CR60","unstructured":"McMahan, B., Moore, E., Ramage, D., Hampson, S., y\u00a0Arcas, B.A.: Communication-efficient learning of deep networks from decentralized data. In: Proceedings of the 20th International Conference on Artificial Intelligence and Statistics, AISTATS 2017, vol.\u00a054, pp. 1273\u20131282. PMLR (2017)"},{"key":"956_CR61","doi-asserted-by":"crossref","unstructured":"Mohassel, P., Rindal, P., Rosulek, M.: Fast database joins and PSI for secret shared data. In: CCS \u201920: 2020 ACM SIGSAC Conference on Computer and Communications Security, 2020, pp. 1271\u20131287. ACM (2020)","DOI":"10.1145\/3372297.3423358"},{"key":"956_CR62","unstructured":"Moritz, P., Nishihara, R., Wang, S., Tumanov, A., Liaw, R., Liang, E., Elibol, M., Yang, Z., Paul, W., Jordan, M.I., Stoica, I.: Ray: A distributed framework for emerging AI applications. In: 13th USENIX Symposium on Operating Systems Design and Implementation, OSDI 2018, Carlsbad, CA, USA, October 8-10, 2018, pp. 561\u2013577. USENIX Association (2018)"},{"key":"956_CR63","doi-asserted-by":"crossref","unstructured":"Nargesian, F., Pu, K.Q., Zhu, E., Bashardoost, B.G., Miller, R.J.: Organizing data lakes for navigation. In: Proceedings of the 2020 International Conference on Management of Data, SIGMOD Conference 2020, online conference [Portland, OR, USA], June 14-19, 2020, pp. 1939\u20131950. ACM (2020)","DOI":"10.1145\/3318464.3380605"},{"issue":"12","key":"956_CR64","doi-asserted-by":"publisher","first-page":"3502","DOI":"10.14778\/3415478.3415572","volume":"13","author":"D Olteanu","year":"2020","unstructured":"Olteanu, D.: The relational data borg is learning. Proc. VLDB Endow. 13(12), 3502\u20133515 (2020)","journal-title":"Proc. VLDB Endow."},{"key":"956_CR65","doi-asserted-by":"publisher","unstructured":"Overman, T., Blum, G., Klabjan, D.: A primal-dual algorithm for hybrid federated learning. CoRR abs\/2210.08106 (2022). https:\/\/doi.org\/10.48550\/arXiv.2210.08106","DOI":"10.48550\/arXiv.2210.08106"},{"key":"956_CR66","doi-asserted-by":"crossref","unstructured":"Picado, J., Termehchy, A., Fern, A., Ataei, P.: Schema independent relational learning. In: Proceedings of the 2017 ACM International Conference on Management of Data, SIGMOD Conference 2017, Chicago, IL, USA, May 14-19, 2017, pp. 929\u2013944. ACM (2017)","DOI":"10.1145\/3035918.3035923"},{"key":"956_CR67","unstructured":"Raedt, L.D., Kersting, K., Natarajan, S., Poole, D.: Statistical Relational Artificial Intelligence: Logic, Probability, and Computation. Synthesis Lectures on Artificial Intelligence and Machine Learning. Morgan & Claypool Publishers (2016)"},{"key":"956_CR68","unstructured":"Ramakrishnan, R., Gehrke, J.: Database management systems (3. ed.). McGraw-Hill (2003)"},{"key":"956_CR69","doi-asserted-by":"crossref","unstructured":"Rouhani, B.D., Riazi, M.S., Koushanfar, F.: DeepSecure: Scalable provably-secure deep learning. In: Proceedings of the 55th Annual Design Automation Conference, pp. 1\u20136 (2018)","DOI":"10.1145\/3195970.3196023"},{"issue":"1","key":"956_CR70","doi-asserted-by":"publisher","first-page":"35","DOI":"10.3233\/IA-200075","volume":"15","author":"S Saha","year":"2021","unstructured":"Saha, S., Ahmad, T.: Federated transfer learning: Concept and applications. Intelligenza Artificiale 15(1), 35\u201344 (2021)","journal-title":"Intelligenza Artificiale"},{"issue":"12","key":"956_CR71","doi-asserted-by":"publisher","first-page":"1854","DOI":"10.14778\/3352063.3352083","volume":"12","author":"SS Sandha","year":"2019","unstructured":"Sandha, S.S., Cabrera, W., Al-Kateb, M., Nair, S., Srivastava, M.B.: In-database distributed machine learning: Demonstration using teradata SQL engine. Proc. VLDB Endow. 12(12), 1854\u20131857 (2019)","journal-title":"Proc. VLDB Endow."},{"key":"956_CR72","doi-asserted-by":"crossref","unstructured":"Santos, A.S.R., Bessa, A., Chirigati, F., Musco, C., Freire, J.: Correlation sketches for approximate join-correlation queries. In: SIGMOD \u201921: International Conference on Management of Data, Virtual Event, China, June 20-25, 2021, pp. 1531\u20131544. ACM (2021)","DOI":"10.1145\/3448016.3458456"},{"key":"956_CR73","unstructured":"Schleich, M.: Structure-aware machine learning over multi-relational databases. Ph.D. thesis, University of Oxford, UK (2020). https:\/\/ethos.bl.uk\/OrderDetails.do?uin=uk.bl.ethos.808366"},{"key":"956_CR74","doi-asserted-by":"crossref","unstructured":"Schleich, M., Olteanu, D., Ciucanu, R.: Learning linear regression models over factorized joins. In: Proceedings of the 2016 International Conference on Management of Data, SIGMOD Conference 2016, pp. 3\u201318. ACM (2016)","DOI":"10.1145\/2882903.2882939"},{"key":"956_CR75","doi-asserted-by":"crossref","unstructured":"Schleich, M., Olteanu, D., Khamis, M.A., Ngo, H.Q., Nguyen, X.: A layered aggregate engine for analytics workloads. In: Proceedings of the 2019 International Conference on Management of Data, SIGMOD Conference 2019, pp. 1642\u20131659. ACM (2019)","DOI":"10.1145\/3299869.3324961"},{"key":"956_CR76","doi-asserted-by":"crossref","unstructured":"Schleich, M., Olteanu, D., Khamis, M.A., Ngo, H.Q., Nguyen, X.: Learning models over relational data: A brief tutorial. In: Scalable Uncertainty Management - 13th International Conference, SUM 2019, Compi\u00e8gne, France, December 16-18, 2019, Proceedings, Lecture Notes in Computer Science, vol. 11940, pp. 423\u2013432. Springer (2019)","DOI":"10.1007\/978-3-030-35514-2_32"},{"issue":"1","key":"956_CR77","doi-asserted-by":"publisher","first-page":"48","DOI":"10.1145\/5236.5241","volume":"11","author":"A Segev","year":"1986","unstructured":"Segev, A.: Optimization of join operations in horizontally partitioned database systems. ACM Trans. Database Syst. 11(1), 48\u201380 (1986)","journal-title":"ACM Trans. Database Syst."},{"key":"956_CR78","unstructured":"Shekelyan, M., Cormode, G., Ma, Q., Shanghooshabad, A.M., Triantafillou, P.: Streaming weighted sampling over join queries. In: Proceedings 26th International Conference on Extending Database Technology, EDBT 2023, Ioannina, Greece, March 28-31, 2023, pp. 298\u2013310 (2023)"},{"key":"956_CR79","unstructured":"Ullman, J.D.: Principles of Database and Knowledge-Base Systems, Volume I. Computer Science Press (1988)"},{"key":"956_CR80","unstructured":"Vepakomma, P., Gupta, O., Swedish, T., Raskar, R.: Split learning for health: Distributed deep learning without sharing raw patient data. arXiv preprint arXiv:1812.00564 (2018)"},{"key":"956_CR81","doi-asserted-by":"publisher","first-page":"5234","DOI":"10.1109\/TSP.2021.3106104","volume":"69","author":"J Wang","year":"2021","unstructured":"Wang, J., Liu, Q., Liang, H., Joshi, G., Poor, H.V.: A novel framework for the analysis and design of heterogeneous federated learning. IEEE Trans. Signal Process. 69, 5234\u20135249 (2021)","journal-title":"IEEE Trans. Signal Process."},{"issue":"12","key":"956_CR82","doi-asserted-by":"publisher","first-page":"2090","DOI":"10.14778\/3407790.3407811","volume":"13","author":"Y Wu","year":"2020","unstructured":"Wu, Y., Cai, S., Xiao, X., Chen, G., Ooi, B.C.: Privacy preserving vertical federated learning for tree-based models. Proceedings of the VLDB Endowment 13(12), 2090\u20132103 (2020)","journal-title":"Proceedings of the VLDB Endowment"},{"key":"956_CR83","doi-asserted-by":"publisher","unstructured":"Xie, C., Chen, P., Zhang, C., Li, B.: Improving privacy-preserving vertical federated learning by efficient communication with ADMM. CoRR abs\/2207.10226 (2022). https:\/\/doi.org\/10.48550\/arXiv.2207.10226","DOI":"10.48550\/arXiv.2207.10226"},{"key":"956_CR84","doi-asserted-by":"crossref","unstructured":"Xie, Y., Wang, Z., Gao, D., Chen, D., Yao, L., Kuang, W., Li, Y., Ding, B., Zhou, J.: Federatedscope: A flexible federated learning platform for heterogeneity. Proc. VLDB Endow. 16(5), 1059\u20131072 (2023)","DOI":"10.14778\/3579075.3579081"},{"key":"956_CR85","unstructured":"Xu, Z., De, S., Figueiredo, M.A.T., Studer, C., Goldstein, T.: An empirical study of ADMM for nonconvex problems. CoRR abs\/1612.03349 (2016)"},{"key":"956_CR86","doi-asserted-by":"crossref","unstructured":"Yakout, M., Ganjam, K., Chakrabarti, K., Chaudhuri, S.:ACM,: Infogather: entity augmentation and attribute discovery by holistic matching with web tables. Presented at the (2012)","DOI":"10.1145\/2213836.2213848"},{"key":"956_CR87","doi-asserted-by":"crossref","unstructured":"Yang, K., Gao, Y., Liang, L., Yao, B., Wen, S., Chen, G.: Towards factorized SVM with gaussian kernels over normalized data. In: 36th IEEE International Conference on Data Engineering, ICDE 2020, Dallas, TX, USA, April 20-24, 2020, pp. 1453\u20131464. IEEE (2020)","DOI":"10.1109\/ICDE48307.2020.00129"},{"key":"956_CR88","doi-asserted-by":"publisher","unstructured":"Yang, Q., Liu, Y., Chen, T., Tong, Y.: Federated machine learning: Concept and applications. ACM Trans. Intell. Syst. Technol. 10(2), 12:1\u201312:19 (2019). https:\/\/doi.org\/10.1145\/3298981","DOI":"10.1145\/3298981"},{"key":"956_CR89","unstructured":"Yang, S., Ren, B., Zhou, X., Liu, L.: Parallel distributed logistic regression for vertical federated learning without third-party coordinator. arXiv preprint arXiv:1911.09824 (2019)"},{"key":"956_CR90","unstructured":"Yousefpour, A., Shilov, I., Sablayrolles, A., Testuggine, D., Prasad, K., Malek, M., Nguyen, J., Ghosh, S., Bharadwaj, A., Zhao, J., Cormode, G., Mironov, I.: Opacus: User-friendly differential privacy library in pytorch. CoRR abs\/2109.12298 (2021). https:\/\/arxiv.org\/abs\/2109.12298"},{"issue":"3","key":"956_CR91","doi-asserted-by":"publisher","first-page":"197","DOI":"10.14778\/2735508.2735510","volume":"8","author":"Q Zeng","year":"2014","unstructured":"Zeng, Q., Patel, J.M., Page, D.: Quickfoil: Scalable inductive logic programming. Proc. VLDB Endow. 8(3), 197\u2013208 (2014)","journal-title":"Proc. VLDB Endow."},{"key":"956_CR92","first-page":"10896","volume":"35","author":"Q Zhang","year":"2021","unstructured":"Zhang, Q., Gu, B., Deng, C., Huang, H.: Secure bilevel asynchronous vertical federated learning with backward updating. In: Proceedings of the AAAI Conference on Artificial Intelligence 35, 10896\u201310904 (2021)","journal-title":"In: Proceedings of the AAAI Conference on Artificial Intelligence"},{"key":"956_CR93","unstructured":"Zhang, X., Yin, W., Hong, M., Chen, T.: Hybrid federated learning: Algorithms and implementation. CoRR abs\/2012.12420 (2020). https:\/\/arxiv.org\/abs\/2012.12420"},{"key":"956_CR94","doi-asserted-by":"crossref","unstructured":"Zhao, Z., Christensen, R., Li, F., Hu, X., Yi, K.: Random sampling over joins revisited. In: Proceedings of the 2018 International Conference on Management of Data, SIGMOD Conference 2018, Houston, TX, USA, June 10-15, 2018, pp. 1525\u20131539. ACM (2018)","DOI":"10.1145\/3183713.3183739"},{"key":"956_CR95","doi-asserted-by":"crossref","unstructured":"Zhou, Z., Tian, Y., Peng, C.: Privacy-preserving federated learning framework with general aggregation and multiparty entity matching. Wirel. Commun. Mob. Comput. 2021, 6692,061:1\u20136692,061:14 (2021)","DOI":"10.1155\/2021\/6692061"},{"issue":"12","key":"956_CR96","doi-asserted-by":"publisher","first-page":"1185","DOI":"10.14778\/2994509.2994534","volume":"9","author":"E Zhu","year":"2016","unstructured":"Zhu, E., Nargesian, F., Pu, K.Q., Miller, R.J.: LSH ensemble: Internet-scale domain search. Proc. VLDB Endow. 9(12), 1185\u20131196 (2016)","journal-title":"Proc. VLDB Endow."}],"container-title":["The VLDB Journal"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00778-025-00956-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00778-025-00956-2","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00778-025-00956-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,7]],"date-time":"2026-02-07T07:27:55Z","timestamp":1770449275000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00778-025-00956-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,26]]},"references-count":96,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,1]]}},"alternative-id":["956"],"URL":"https:\/\/doi.org\/10.1007\/s00778-025-00956-2","relation":{},"ISSN":["1066-8888","0949-877X"],"issn-type":[{"value":"1066-8888","type":"print"},{"value":"0949-877X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,12,26]]},"assertion":[{"value":"7 February 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 October 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 November 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 December 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"6"}}