{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,1]],"date-time":"2025-08-01T04:03:21Z","timestamp":1754021001624,"version":"3.40.3"},"publisher-location":"Cham","reference-count":38,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783031112164"},{"type":"electronic","value":"9783031112171"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-11217-1_4","type":"book-chapter","created":{"date-parts":[[2022,7,15]],"date-time":"2022-07-15T21:02:35Z","timestamp":1657918955000},"page":"50-63","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Why Not to\u00a0Trust Big Data: Discussing Statistical Paradoxes"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9024-8768","authenticated-orcid":false,"given":"Rahul","family":"Sharma","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6658-1712","authenticated-orcid":false,"given":"Minakshi","family":"Kaushik","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7858-9463","authenticated-orcid":false,"given":"Sijo Arakkal","family":"Peious","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0034-018X","authenticated-orcid":false,"given":"Mahtab","family":"Shahin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8026-4246","authenticated-orcid":false,"given":"Ankit","family":"Vidyarthi","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2851-4260","authenticated-orcid":false,"given":"Prayag","family":"Tiwari","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3376-7489","authenticated-orcid":false,"given":"Dirk","family":"Draheim","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,7,16]]},"reference":[{"unstructured":"California Department of Developmental Services CDDS expenditures. https:\/\/kaggle.com\/wduckett\/californiaddsexpenditures","key":"4_CR1"},{"unstructured":"Agrawal, R., Srikant, R.: Fast algorithms for mining association rules in large databases. In: Proceedings of VLDB 1994 - The 20th International Conference on Very Large Data Bases, pp. 487\u2013499. Morgan Kaufmann (1994)","key":"4_CR2"},{"doi-asserted-by":"publisher","unstructured":"Alipourfard, N., Fennell, P.G., Lerman, K.: Can you trust the trend? Discovering Simpson\u2019s paradoxes in social data. In: Proceedings of the Eleventh ACM International Conference on Web Search and Data Mining, WSDM 2018, pp. 19\u201327. Association for Computing Machinery, New York (2018). https:\/\/doi.org\/10.1145\/3159652.3159684","key":"4_CR3","DOI":"10.1145\/3159652.3159684"},{"doi-asserted-by":"crossref","unstructured":"Alipourfard, N., Fennell, P.G., Lerman, K.: Using Simpson\u2019s paradox to discover interesting patterns in behavioral data. In: Proceedings of the Twelfth International AAAI Conference on Web and Social Media. AAAI Publications (2018)","key":"4_CR4","DOI":"10.1609\/icwsm.v12i1.15017"},{"doi-asserted-by":"crossref","unstructured":"Berkson, J.: Limitations of the application of fourfold table analysis to hospital data. Biometrics Bull. 2(3), 47\u201353 (1946). http:\/\/www.jstor.org\/stable\/3002000","key":"4_CR5","DOI":"10.2307\/3002000"},{"issue":"338","key":"4_CR6","doi-asserted-by":"publisher","first-page":"364","DOI":"10.1080\/01621459.1972.10482387","volume":"67","author":"CR Blyth","year":"1972","unstructured":"Blyth, C.R.: On Simpson\u2019s paradox and the sure-thing principle. J. Am. Stat. Assoc. 67(338), 364\u2013366 (1972)","journal-title":"J. Am. Stat. Assoc."},{"issue":"1","key":"4_CR7","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman, L.: Random forests. Mach. Learn. 45(1), 5\u201332 (2001)","journal-title":"Mach. Learn."},{"doi-asserted-by":"crossref","unstructured":"Cattell, R.B.: P-technique factorization and the determination of individual dynamic structure. J. Clin. Psychol. (1952)","key":"4_CR8","DOI":"10.1002\/1097-4679(195201)8:1<5::AID-JCLP2270080103>3.0.CO;2-S"},{"doi-asserted-by":"publisher","unstructured":"Commission, E., Centre, J.R., Wenzl, T.: Smoking and COVID-19: a review of studies suggesting a protective effect of smoking against COVID-19. Publications Office (2020). https:\/\/doi.org\/10.2760\/564217","key":"4_CR9","DOI":"10.2760\/564217"},{"issue":"1","key":"4_CR10","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1177\/001316447403400105","volume":"34","author":"AJ Conger","year":"1974","unstructured":"Conger, A.J.: A revised definition for suppressor variables: a guide to their identification and interpretation. Educ. Psychol. Measur. 34(1), 35\u201346 (1974)","journal-title":"Educ. Psychol. Measur."},{"issue":"3","key":"4_CR11","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1007\/BF00994018","volume":"20","author":"C Cortes","year":"1995","unstructured":"Cortes, C., Vapnik, V.: Support-vector networks. Mach. Learn. 20(3), 273\u2013297 (1995)","journal-title":"Mach. Learn."},{"issue":"1","key":"4_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1111\/j.2517-6161.1979.tb01052.x","volume":"41","author":"AP Dawid","year":"1979","unstructured":"Dawid, A.P.: Conditional independence in statistical theory. J. Roy. Stat. Soc.: Ser. B (Methodol.) 41(1), 1\u201315 (1979). https:\/\/doi.org\/10.1111\/j.2517-6161.1979.tb01052.x","journal-title":"J. Roy. Stat. Soc.: Ser. B (Methodol.)"},{"unstructured":"Draheim, D.: DEXA\u20192019 keynote presentation: future perspectives of association rule mining based on partial conditionalization, Linz, Austria, 28th August 2019. https:\/\/doi.org\/10.13140\/RG.2.2.17763.48163","key":"4_CR13"},{"unstructured":"Draheim, D.: Future perspectives of association rule mining based on partial conditionalization. In: Hartmann, S., K\u00fcng, J., Chakravarthy, S., Anderst-Kotsis, G., A Min Tjoa, Khalil, I. (eds.) Database and Expert Systems Applications. LNCS, vol. 11706, p.\u00a0xvi. Springer, Heidelberg (2019)(2019)","key":"4_CR14"},{"issue":"2","key":"4_CR15","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1111\/j.1469-1809.1936.tb02137.x","volume":"7","author":"RA Fisher","year":"1936","unstructured":"Fisher, R.A.: The use of multiple measurement in taxonomic problems. Ann. Eugen. 7(2), 179\u2013188 (1936). https:\/\/doi.org\/10.1111\/j.1469-1809.1936.tb02137.x","journal-title":"Ann. Eugen."},{"doi-asserted-by":"crossref","unstructured":"Fisher, R.A.: III. The influence of rainfall on the yield of wheat at rothamsted. Philos. Trans. R. Soc. London Ser. B Containing Papers Biological Character 213(402\u2013410), 89\u2013142 (1925)","key":"4_CR16","DOI":"10.1098\/rstb.1925.0003"},{"unstructured":"Freitas, A.A., McGarry, K.J., Correa, E.S.: Integrating Bayesian networks and Simpson\u2019s paradox in data mining. In: Texts in Philosophy. College Publications (2007)","key":"4_CR17"},{"issue":"1","key":"4_CR18","doi-asserted-by":"publisher","first-page":"5749","DOI":"10.1038\/s41467-020-19478-2","volume":"11","author":"GJ Griffith","year":"2020","unstructured":"Griffith, G.J., et al.: Collider bias undermines our understanding of COVID-19 disease risk and severity. Nat. Commun. 11(1), 5749 (2020). https:\/\/doi.org\/10.1038\/s41467-020-19478-2","journal-title":"Nat. Commun."},{"key":"4_CR19","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"244","DOI":"10.1007\/978-3-030-93620-4_18","volume-title":"Big Data Analytics","author":"M Kaushik","year":"2021","unstructured":"Kaushik, M., Sharma, R., Peious, S.A., Draheim, D.: Impact-driven discretization of\u00a0numerical factors: case of\u00a0two- and\u00a0three-partitioning. In: Srirama, S.N., Lin, J.C.-W., Bhatnagar, R., Agarwal, S., Reddy, P.K. (eds.) BDA 2021. LNCS, vol. 13147, pp. 244\u2013260. Springer, Cham (2021). https:\/\/doi.org\/10.1007\/978-3-030-93620-4_18"},{"key":"4_CR20","series-title":"Communications in Computer and Information Science","doi-asserted-by":"publisher","first-page":"3","DOI":"10.1007\/978-981-33-4370-2_1","volume-title":"Future Data and Security Engineering. Big Data, Security and Privacy, Smart City and Industry 4.0 Applications","author":"M Kaushik","year":"2020","unstructured":"Kaushik, M., Sharma, R., Peious, S.A., Shahin, M., Ben Yahia, S., Draheim, D.: On the potential of numerical association rule mining. In: Dang, T.K., K\u00fcng, J., Takizawa, M., Chung, T.M. (eds.) FDSE 2020. CCIS, vol. 1306, pp. 3\u201320. Springer, Singapore (2020). https:\/\/doi.org\/10.1007\/978-981-33-4370-2_1"},{"issue":"5","key":"4_CR21","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s42979-021-00725-2","volume":"2","author":"M Kaushik","year":"2021","unstructured":"Kaushik, M., Sharma, R., Peious, S.A., Shahin, M., Yahia, S.B., Draheim, D.: A systematic assessment of numerical association rule mining methods. SN Comput. Sci. 2(5), 1\u201313 (2021). https:\/\/doi.org\/10.1007\/s42979-021-00725-2","journal-title":"SN Comput. Sci."},{"key":"4_CR22","doi-asserted-by":"publisher","first-page":"513","DOI":"10.3389\/fpsyg.2013.00513","volume":"4","author":"R Kievit","year":"2013","unstructured":"Kievit, R., Frankenhuis, W., Waldorp, L., Borsboom, D.: Simpson\u2019s paradox in psychological science: a practical guide. Front. Psychol. 4, 513 (2013). https:\/\/doi.org\/10.3389\/fpsyg.2013.00513","journal-title":"Front. Psychol."},{"issue":"3","key":"4_CR23","doi-asserted-by":"publisher","first-page":"307","DOI":"10.1080\/00031305.2020.1790216","volume":"74","author":"Y Kim","year":"2020","unstructured":"Kim, Y.: The 9 pitfalls of data science. Am. Stat. 74(3), 307\u2013307 (2020). https:\/\/doi.org\/10.1080\/00031305.2020.1790216","journal-title":"Am. Stat."},{"unstructured":"King, G., Roberts, M.: EI: A (n R) program for ecological inference. Harvard University (2012)","key":"4_CR24"},{"doi-asserted-by":"publisher","unstructured":"Ma, H.Y., Lin, D.K.J.: Effect of Simpson\u2019s paradox on market basket analysis. J. Chin. Stat. Assoc. 42(2), 209\u2013221 (2004). https:\/\/doi.org\/10.29973\/JCSA.200406.0007","key":"4_CR25","DOI":"10.29973\/JCSA.200406.0007"},{"doi-asserted-by":"publisher","unstructured":"MacKinnon, D.P., Fairchild, A.J., Fritz, M.S.: Mediation analysis. Annu. Rev. Psychol. 58(1), 593\u2013614 (2007). https:\/\/doi.org\/10.1146\/annurev.psych.58.110405.085542. pMID: 16968208","key":"4_CR26","DOI":"10.1146\/annurev.psych.58.110405.085542"},{"issue":"450","key":"4_CR27","first-page":"428","volume":"95","author":"J Pearl","year":"2000","unstructured":"Pearl, J.: Causal inference without counterfactuals: comment. J. Am. Stat. Assoc. 95(450), 428\u2013431 (2000)","journal-title":"J. Am. Stat. Assoc."},{"doi-asserted-by":"publisher","unstructured":"Pearl, J.: Understanding Simpson\u2019s paradox. SSRN Electron. J. 68 (2013). https:\/\/doi.org\/10.2139\/ssrn.2343788","key":"4_CR28","DOI":"10.2139\/ssrn.2343788"},{"key":"4_CR29","doi-asserted-by":"publisher","first-page":"257","DOI":"10.1098\/rsta.1899.0006","volume":"192","author":"LA Pearson Karl","year":"1899","unstructured":"Pearson Karl, L.A., Leslie, B.M.: Genetic (reproductive) selection: inheritance of fertility in man, and of fecundity in thoroughbred racehorses. Philos. Trans. R. Soc. Lond. Ser. A 192, 257\u2013330 (1899)","journal-title":"Philos. Trans. R. Soc. Lond. Ser. A"},{"doi-asserted-by":"publisher","unstructured":"Quinlan, J.: Combining instance-based and model-based learning. In: Machine Learning Proceedings 1993, pp. 236\u2013243. Elsevier (1993). https:\/\/doi.org\/10.1016\/B978-1-55860-307-3.50037-X","key":"4_CR30","DOI":"10.1016\/B978-1-55860-307-3.50037-X"},{"issue":"3","key":"4_CR31","doi-asserted-by":"publisher","first-page":"351","DOI":"10.2307\/2087176","volume":"15","author":"WS Robinson","year":"1950","unstructured":"Robinson, W.S.: Ecological correlations and the behavior of individuals. Am. Sociol. Rev. 15(3), 351\u2013357 (1950)","journal-title":"Am. Sociol. Rev."},{"issue":"1","key":"4_CR32","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1093\/biomet\/70.1.41","volume":"70","author":"PR Rosenbaum","year":"1983","unstructured":"Rosenbaum, P.R., Rubin, D.B.: The central role of the propensity score in observational studies for causal effects. Biometrika 70(1), 41\u201355 (1983)","journal-title":"Biometrika"},{"issue":"2","key":"4_CR33","doi-asserted-by":"crossref","first-page":"238","DOI":"10.1111\/j.2517-6161.1951.tb00088.x","volume":"13","author":"EH Simpson","year":"1951","unstructured":"Simpson, E.H.: The interpretation of interaction in contingency tables. J. Roy. Stat. Soc.: Ser. B (Methodol.) 13(2), 238\u2013241 (1951)","journal-title":"J. Roy. Stat. Soc.: Ser. B (Methodol.)"},{"doi-asserted-by":"crossref","unstructured":"Srikant, R., Agrawal, R.: Mining quantitative association rules in large relational tables. In: Proceedings of the 1996 ACM SIGMOD International Conference on Management of Data, pp. 1\u201312 (1996)","key":"4_CR34","DOI":"10.1145\/235968.233311"},{"issue":"1","key":"4_CR35","doi-asserted-by":"publisher","first-page":"8","DOI":"10.1080\/10691898.2014.11889697","volume":"22","author":"SA Taylor","year":"2014","unstructured":"Taylor, S.A., Mickel, A.E.: Simpson\u2019s paradox: a data set and discrimination case study exercise. J. Stat. Educ. 22(1), 8 (2014). https:\/\/doi.org\/10.1080\/10691898.2014.11889697","journal-title":"J. Stat. Educ."},{"issue":"1","key":"4_CR36","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1742-7622-5-2","volume":"5","author":"YK Tu","year":"2008","unstructured":"Tu, Y.K., Gunnell, D., Gilthorpe, M.S.: Simpson\u2019s paradox, lord\u2019s paradox, and suppression effects are the same phenomenon-the reversal paradox. Emerg. Themes Epidemiol. 5(1), 1\u20139 (2008)","journal-title":"Emerg. Themes Epidemiol."},{"issue":"1","key":"4_CR37","doi-asserted-by":"publisher","first-page":"18","DOI":"10.1109\/tai.2021.3073088","volume":"2","author":"J Von Kugelgen","year":"2021","unstructured":"Von Kugelgen, J., Gresele, L., Scholkopf, B.: Simpson\u2019s paradox in COVID-19 case fatality rates: a mediation analysis of age-related causal effects. IEEE Trans. Artif. Intell. 2(1), 18\u201327 (2021). https:\/\/doi.org\/10.1109\/tai.2021.3073088","journal-title":"IEEE Trans. Artif. Intell."},{"issue":"2","key":"4_CR38","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1093\/biomet\/2.2.121","volume":"2","author":"GU Yule","year":"1903","unstructured":"Yule, G.U.: Notes on the theory of association of attributes in statistics. Biometrika 2(2), 121\u2013134 (1903)","journal-title":"Biometrika"}],"container-title":["Lecture Notes in Computer Science","Database Systems for Advanced Applications. DASFAA 2022 International Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-11217-1_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,29]],"date-time":"2024-09-29T06:42:54Z","timestamp":1727592174000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-11217-1_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031112164","9783031112171"],"references-count":38,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-11217-1_4","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"16 July 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"DASFAA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Database Systems for Advanced Applications","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2022","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"11 April 2022","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14 April 2022","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"dasfaa2022","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/www.dasfaa2022.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"CMT","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"543","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"72","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"76","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"13% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"6","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Conference was originally planned to take place in Hyberabad, India. 24 other papers are included in the volume.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}