{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T07:19:22Z","timestamp":1740122362557,"version":"3.37.3"},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2024,8,17]],"date-time":"2024-08-17T00:00:00Z","timestamp":1723852800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,8,17]],"date-time":"2024-08-17T00:00:00Z","timestamp":1723852800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Data Min Knowl Disc"],"published-print":{"date-parts":[[2024,11]]},"DOI":"10.1007\/s10618-024-01054-7","type":"journal-article","created":{"date-parts":[[2024,8,17]],"date-time":"2024-08-17T14:02:20Z","timestamp":1723903340000},"page":"3643-3689","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Bayesian network Motifs for reasoning over heterogeneous unlinked datasets"],"prefix":"10.1007","volume":"38","author":[{"given":"Yi","family":"Sui","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alex","family":"Kwan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alexander W.","family":"Olson","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7984-8394","authenticated-orcid":false,"given":"Scott","family":"Sanner","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Daniel A.","family":"Silver","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2024,8,17]]},"reference":[{"key":"1054_CR1","doi-asserted-by":"publisher","first-page":"67","DOI":"10.1016\/j.csda.2019.02.004","volume":"137","author":"L Azzimonti","year":"2019","unstructured":"Azzimonti L, Corani G, Zaffalon M (2019) Hierarchical estimation of parameters in Bayesian networks. Comput Stat Data Anal 137:67\u201391. https:\/\/doi.org\/10.1016\/j.csda.2019.02.004","journal-title":"Comput Stat Data Anal"},{"unstructured":"Azzimonti L, Corani G, Scutari M (2020) Structure Learning from Related Data Sets with a Hierarchical Bayesian Score. In: Jaeger M, Nielsen TD (eds) Proceedings of the 10th International Conference on Probabilistic Graphical Models. Proceedings of Machine Learning Research, vol. 138, pp. 5\u201316. PMLR, ???","key":"1054_CR2"},{"doi-asserted-by":"crossref","unstructured":"Bhattacharya P, Gavrilova ML (2007) Voronoi diagram in optimal path planning. In: 4th International Symposium on Voronoi Diagrams in Science and Engineering (ISVD 2007), pp. 38\u201347","key":"1054_CR3","DOI":"10.1109\/ISVD.2007.43"},{"doi-asserted-by":"publisher","unstructured":"Carpenter J, Kenward M (2012). Multiple imputation and its application. https:\/\/doi.org\/10.1002\/9781119942283","key":"1054_CR4","DOI":"10.1002\/9781119942283"},{"unstructured":"Chicago C. Chicago Community Area Boundaries. https:\/\/data.cityofchicago.org\/Facilities-Geographic-Boundaries\/Boundaries-Community-Areas-current-\/cauq-8yn6","key":"1054_CR5"},{"doi-asserted-by":"publisher","unstructured":"Christen P (2012). Data Matching. https:\/\/doi.org\/10.1007\/978-3-642-31164-2","key":"1054_CR6","DOI":"10.1007\/978-3-642-31164-2"},{"key":"1054_CR7","doi-asserted-by":"publisher","first-page":"297","DOI":"10.1001\/jama.2013.8267","volume":"310","author":"W Chung","year":"2013","unstructured":"Chung W, Buseman C, Joyner S, Hughes S, Fomby T, Luby J, Haley R (2013) The 2012 west Nile encephalitis epidemic in Dallas, Texas. JAMA J Am Med Assoc 310:297\u2013307. https:\/\/doi.org\/10.1001\/jama.2013.8267","journal-title":"JAMA J Am Med Assoc"},{"unstructured":"Company CB. CBC Vote Compass 2014 Toronto. https:\/\/www.cbc.ca\/news2\/interactives\/votecompass\/toronto2014.html","key":"1054_CR8"},{"issue":"3\u20134","key":"1054_CR9","doi-asserted-by":"publisher","first-page":"197","DOI":"10.1561\/1900000052","volume":"7","author":"GV den Broeck","year":"2017","unstructured":"den Broeck GV, Suciu D (2017) Query processing on probabilistic data: a survey. Found Trends Datab 7(3\u20134):197\u2013341. https:\/\/doi.org\/10.1561\/1900000052","journal-title":"Found Trends Datab"},{"key":"1054_CR10","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1016\/S0933-3657(97)00384-9","volume":"10","author":"F D\u00edez","year":"1997","unstructured":"D\u00edez F, Mira J, Iturralde E, Zubillaga S (1997) Diaval, a Bayesian expert system for echocardiography. Artif Intell Med 10:59\u201373. https:\/\/doi.org\/10.1016\/S0933-3657(97)00384-9","journal-title":"Artif Intell Med"},{"key":"1054_CR11","doi-asserted-by":"publisher","first-page":"295","DOI":"10.1162\/153244304773633834","volume":"4","author":"M Druzdzel","year":"2003","unstructured":"Druzdzel M, D\u00edez F (2003) Combining knowledge from different sources in causal probabilistic models. J Mach Learn Res 4:295\u2013316. https:\/\/doi.org\/10.1162\/153244304773633834","journal-title":"J Mach Learn Res"},{"key":"1054_CR12","doi-asserted-by":"publisher","first-page":"293","DOI":"10.1080\/13645570802394003","volume":"12","author":"G Durrant","year":"2009","unstructured":"Durrant G (2009) Imputation methods for handling item-nonresponse in practice: methodological issues and recent debates. Int J Soc Res Methodol 12:293\u2013304. https:\/\/doi.org\/10.1080\/13645570802394003","journal-title":"Int J Soc Res Methodol"},{"doi-asserted-by":"publisher","unstructured":"Duschka O, Genesereth M (1997) Answering recursive queries using views. Proceedings of the ACM SIGACT-SIGMOD-SIGART Symposium on Principles of Database Systems - PODS. https:\/\/doi.org\/10.1145\/263661.263674","key":"1054_CR13","DOI":"10.1145\/263661.263674"},{"issue":"328","key":"1054_CR14","doi-asserted-by":"publisher","first-page":"1183","DOI":"10.1080\/01621459.1969.10501049","volume":"64","author":"IP Fellegi","year":"1969","unstructured":"Fellegi IP, Sunter AB (1969) A theory for record linkage. J Am Stat Assoc 64(328):1183\u20131210. https:\/\/doi.org\/10.1080\/01621459.1969.10501049","journal-title":"J Am Stat Assoc"},{"doi-asserted-by":"publisher","unstructured":"Getoor L, Mihalkova L (2011) Learning statistical models from relational data, pp. 1195\u20131198.https:\/\/doi.org\/10.1145\/1989323.1989451","key":"1054_CR15","DOI":"10.1145\/1989323.1989451"},{"doi-asserted-by":"crossref","unstructured":"Getoor L, Taskar B (2007) Introduction to Statistical Relational Learning. MIT Press, ???","key":"1054_CR16","DOI":"10.7551\/mitpress\/7432.001.0001"},{"key":"1054_CR17","doi-asserted-by":"publisher","first-page":"15437","DOI":"10.1371\/journal.pone.0015437","volume":"5","author":"R Harrigan","year":"2010","unstructured":"Harrigan R, Thomassen H, Buermann W, Cummings R, Kahn M, Smith T (2010) Economic conditions predict prevalence of west Nile virus. PloS one 5:15437. https:\/\/doi.org\/10.1371\/journal.pone.0015437","journal-title":"PloS one"},{"doi-asserted-by":"crossref","unstructured":"Harron K, Goldstein H, Dibben C (2015) Methodological developments in data linkage","key":"1054_CR18","DOI":"10.1002\/9781119072454"},{"key":"1054_CR19","first-page":"10367","volume":"35","author":"S Jin","year":"2022","unstructured":"Jin S, Komaragiri V, Rahman T, Gogate V (2022) Learning tractable probabilistic models from inconsistent local estimates. Adv Neural Inf Process Syst 35:10367\u201310379","journal-title":"Adv Neural Inf Process Syst"},{"key":"1054_CR20","doi-asserted-by":"publisher","DOI":"10.2307\/41720674","author":"J-k Kim","year":"2012","unstructured":"Kim J-k, Rao J (2012) Combining data from two independent surveys: a model-assisted approach. Biometrika. https:\/\/doi.org\/10.2307\/41720674","journal-title":"Biometrika"},{"doi-asserted-by":"publisher","unstructured":"Koller D (1999) Probabilistic relational models, pp. 3\u201313. https:\/\/doi.org\/10.1007\/3-540-48751-4_1","key":"1054_CR21","DOI":"10.1007\/3-540-48751-4_1"},{"unstructured":"Levy A, Rajaraman A, Ordille J (1996) Querying heterogeneous information sources using source descriptions. VLDB","key":"1054_CR22"},{"key":"1054_CR23","doi-asserted-by":"publisher","first-page":"293","DOI":"10.1214\/16-STS584","volume":"32","author":"S Lohr","year":"2017","unstructured":"Lohr S, Raghunathan T (2017) Combining survey data with other data sources. Stat Sci 32:293\u2013312. https:\/\/doi.org\/10.1214\/16-STS584","journal-title":"Stat Sci"},{"key":"1054_CR24","doi-asserted-by":"publisher","first-page":"1019","DOI":"10.2307\/27590779","volume":"101","author":"S Lohr","year":"2006","unstructured":"Lohr S, Rao JNK (2006) Estimation in multiple-frame surveys. J Am Stat Assoc 101:1019\u20131030. https:\/\/doi.org\/10.2307\/27590779","journal-title":"J Am Stat Assoc"},{"unstructured":"McGregor M, Moore A, Stephenson L. The Toronto Election Study. http:\/\/www.torontoelectionstudy.com\/data","key":"1054_CR25"},{"unstructured":"McGregor M, Moore A, Stephenson L. What is aggregate-level data? https:\/\/www.cihi.ca\/en\/faq\/what-is-aggregate-level-data","key":"1054_CR26"},{"key":"1054_CR27","doi-asserted-by":"publisher","first-page":"1512","DOI":"10.1002\/sim.3566","volume":"28","author":"P Metcalf","year":"2009","unstructured":"Metcalf P, Scott A (2009) Using multiple frames in health surveys. Stat Med 28:1512\u201323. https:\/\/doi.org\/10.1002\/sim.3566","journal-title":"Stat Med"},{"issue":"8","key":"1054_CR28","doi-asserted-by":"publisher","first-page":"9171","DOI":"10.1609\/aaai.v37i8.26100","volume":"37","author":"O Mian","year":"2023","unstructured":"Mian O, Kamp M, Vreeken J (2023) Information-theoretic causal discovery and intervention detection over multiple environments. Proc AAAI Conf Artif Intell 37(8):9171\u20139179. https:\/\/doi.org\/10.1609\/aaai.v37i8.26100","journal-title":"Proc AAAI Conf Artif Intell"},{"unstructured":"of Public Health\u00a0(CDPH) CD. West Nile Virus Prediction. https:\/\/www.kaggle.com\/c\/predict-west-nile-virus\/data","key":"1054_CR29"},{"unstructured":"Planning TC (2011) Toronto Ward Profiles. https:\/\/open.toronto.ca\/dataset\/ward-profiles-2014-2018-wards\/","key":"1054_CR30"},{"doi-asserted-by":"publisher","unstructured":"Pottinger R, Halevy A (2001) Minicon: A scalable algorithm for answering queries using views. VLDB Journal 10. https:\/\/doi.org\/10.1007\/s007780100048","key":"1054_CR31","DOI":"10.1007\/s007780100048"},{"doi-asserted-by":"publisher","unstructured":"Qian X (1996) Query folding, pp. 48\u201355. https:\/\/doi.org\/10.1109\/ICDE.1996.492088","key":"1054_CR32","DOI":"10.1109\/ICDE.1996.492088"},{"doi-asserted-by":"crossref","unstructured":"R\u00e4ssler S (2002) Statistical matching. A frequentist theory, practical applications, and alternative bayesian approaches vol. 168","key":"1054_CR33","DOI":"10.1007\/978-1-4613-0053-3_2"},{"key":"1054_CR34","doi-asserted-by":"publisher","first-page":"10","DOI":"10.1186\/1476-072X-6-10","volume":"6","author":"M Ruiz","year":"2007","unstructured":"Ruiz M, Walker E, Foster E, Haramis L, Kitron U (2007) Association of west Nile virus illness and urban landscapes in Chicago and detroit. Int J Health Geogr 6:10. https:\/\/doi.org\/10.1186\/1476-072X-6-10","journal-title":"Int J Health Geogr"},{"key":"1054_CR35","doi-asserted-by":"publisher","DOI":"10.1080\/01621459.2015.1105807","author":"R Steorts","year":"2014","unstructured":"Steorts R, Hall R, Fienberg S (2014) Smered: A Bayesian approach to graphical record linkage and de-duplication. J Am Stat Assoc. https:\/\/doi.org\/10.1080\/01621459.2015.1105807","journal-title":"J Am Stat Assoc"},{"doi-asserted-by":"publisher","unstructured":"Suciu D, Olteanu D, R\u00e9 C, Koch C (2011) Probabilistic Databases https:\/\/doi.org\/10.2200\/S00362ED1V01Y201105DTM016","key":"1054_CR36","DOI":"10.2200\/S00362ED1V01Y201105DTM016"},{"unstructured":"Survey AC (2014) Chicago Community Data Snapshots. https:\/\/datahub.cmap.illinois.gov\/dataset\/community-data-snapshots-raw-data\/resource\/0873e1e4-5160-4396-a2f6-b3961b88852a?inner_span=True","key":"1054_CR37"},{"unstructured":"Wikipedia: 2014 Toronto Mayoral Election. https:\/\/en.wikipedia.org\/wiki\/2014_Toronto_mayoral_election","key":"1054_CR38"},{"key":"1054_CR39","doi-asserted-by":"publisher","DOI":"10.1002\/wics.1317","author":"W Winkler","year":"2014","unstructured":"Winkler W (2014) Matching and record linkage. Wiley Interdiscip Rev Comput Stat. https:\/\/doi.org\/10.1002\/wics.1317","journal-title":"Wiley Interdiscip Rev Comput Stat"},{"key":"1054_CR40","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2019.2940019","author":"B Zhang","year":"2019","unstructured":"Zhang B, Sanner S, Bouadjenek MR, Gupta S (2019) Bayesian networks for data integration in the absence of foreign keys. IEEE Trans Knowl Data Eng. https:\/\/doi.org\/10.1109\/TKDE.2019.2940019","journal-title":"IEEE Trans Knowl Data Eng"}],"container-title":["Data Mining and Knowledge Discovery"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-024-01054-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10618-024-01054-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10618-024-01054-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,28]],"date-time":"2024-10-28T09:12:24Z","timestamp":1730106744000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10618-024-01054-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,8,17]]},"references-count":40,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2024,11]]}},"alternative-id":["1054"],"URL":"https:\/\/doi.org\/10.1007\/s10618-024-01054-7","relation":{},"ISSN":["1384-5810","1573-756X"],"issn-type":[{"type":"print","value":"1384-5810"},{"type":"electronic","value":"1573-756X"}],"subject":[],"published":{"date-parts":[[2024,8,17]]},"assertion":[{"value":"17 October 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 June 2024","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 August 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no Conflict of interest to declare that are relevant to the content of this article.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}