{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,10]],"date-time":"2026-05-10T08:43:30Z","timestamp":1778402610524,"version":"3.51.4"},"reference-count":32,"publisher":"Springer Science and Business Media LLC","issue":"1","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Knowl Inf Syst"],"published-print":{"date-parts":[[2012,10]]},"DOI":"10.1007\/s10115-011-0463-8","type":"journal-article","created":{"date-parts":[[2011,12,3]],"date-time":"2011-12-03T08:18:44Z","timestamp":1322900324000},"page":"1-33","source":"Crossref","is-referenced-by-count":932,"title":["Data preprocessing techniques for classification without discrimination"],"prefix":"10.1007","volume":"33","author":[{"given":"Faisal","family":"Kamiran","sequence":"first","affiliation":[]},{"given":"Toon","family":"Calders","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2011,12,3]]},"reference":[{"key":"463_CR1","unstructured":"Asuncion A, Newman D (2007) UCI machine learning repository"},{"key":"463_CR2","unstructured":"Attorney-General\u2019s Department C (1984) Australian sex discrimination act 1984. via. http:\/\/www.comlaw.gov.au\/Details\/C2010C00056"},{"key":"463_CR3","doi-asserted-by":"crossref","unstructured":"Calders T, Kamiran F, Pechenizkiy M (2009) Building classifiers with independency constraints. In: IEEE ICDM workshop on domain driven data mining. IEEE press","DOI":"10.1109\/ICDMW.2009.83"},{"issue":"2","key":"463_CR4","doi-asserted-by":"crossref","first-page":"277","DOI":"10.1007\/s10618-010-0190-x","volume":"21","author":"T Calders","year":"2010","unstructured":"Calders T, Verwer S (2010) Three naive bayes approaches for discrimination- free classification. Data Min Knowl Discov 21(2): 277\u2013292","journal-title":"Data Min Knowl Discov"},{"key":"463_CR5","unstructured":"Chan PK, Stolfo SJ (1998) Toward scalable learning with non-uniform class and cost distributions: a case study in credit card fraud detection. In: Proceedings of ACM SIGKDD conference on knowledge discovery and data mining, pp 164\u2013168"},{"key":"463_CR6","volume-title":"Women in the labor force: a databook","author":"EL Chao","year":"2007","unstructured":"Chao EL, Rones PL (2007) Women in the labor force: a databook. US Department of Labor and Bureau of Labor Statistics, Washington, DC"},{"key":"463_CR7","doi-asserted-by":"crossref","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla NV, Bowyer KW, Hall LO, Kegelmeyer WP (2002) Smote: synthetic minority over-sampling technique. J Artif Intell Res 16: 321\u2013357","journal-title":"J Artif Intell Res"},{"key":"463_CR8","doi-asserted-by":"crossref","unstructured":"Chawla NV, Hall LO, Joshi A (2005) Wrapper-based computation and evaluation of sampling methods for imbalanced datasets","DOI":"10.1145\/1089827.1089830"},{"key":"463_CR9","doi-asserted-by":"crossref","unstructured":"Domingos P (1999) Metacost: a general method for making classifiers cost-sensitive. In: Proceedings of ACM SIGKDD conference on knowledge discovery and data mining, pp 155\u2013164","DOI":"10.1145\/312129.312220"},{"key":"463_CR10","doi-asserted-by":"crossref","unstructured":"Duivesteijn W, Feelders A (2008) Nearest neighbour classification with monotonicity constraints. In: Proceedings of ECML\/PKDD European conference on machine learning and principles and practice of knowledge discovery in databases. Springer, pp 301\u2013316","DOI":"10.1007\/978-3-540-87479-9_38"},{"key":"463_CR11","unstructured":"Dutch Central Bureau for Statistics (2001) Volkstelling. http:\/\/easy.dans.knaw.nl\/dms"},{"key":"463_CR12","unstructured":"Elkan C (2001) The foundations of cost-sensitive learning. In: Proceedings of IJCAI international joint conference on artificial intelligence, pp 973\u2013978"},{"key":"463_CR13","doi-asserted-by":"crossref","unstructured":"Kamiran F, Calders T (2009a) Classifying without discriminating. In: Proceedings of IEEE IC4 international conference on computer, Control & Communication. IEEE press","DOI":"10.1109\/IC4.2009.4909197"},{"key":"463_CR14","unstructured":"Kamiran F, Calders T (2009b) Discrimination-aware classification. In: BNAIC Benelux conference on artificial intelligence"},{"key":"463_CR15","unstructured":"Kamiran F, Calders T, Pechenizkiy M (2010) Constructing decision trees under non-discriminatory constraints. In: Proceedings of IEEE ICDM international conference on data Mining. IEEE press"},{"issue":"1\u20132","key":"463_CR16","doi-asserted-by":"crossref","first-page":"273","DOI":"10.1016\/S0004-3702(97)00043-X","volume":"97","author":"R Kohavi","year":"1997","unstructured":"Kohavi R, John GH (1997) Wrappers for feature subset selection. Artif Intell 97(1\u20132): 273\u2013324","journal-title":"Artif Intell"},{"issue":"2","key":"463_CR17","first-page":"1","volume":"24","author":"S Koknar-Tezel","year":"2010","unstructured":"Koknar-Tezel S, Latecki L (2010) Improving SVM classification on imbalanced time series data sets with ghost points. Knowl Inf Syst 24(2): 1\u201323","journal-title":"Knowl Inf Syst"},{"key":"463_CR18","unstructured":"Kotlowski W, Dembczynski K, Greco S, Slowinski R (2007) Statistical model for rough set approach to multicriteria classification. In: Proceedings of ECML\/PKDD European conference on machine learning and principles and practice of knowledge discovery in databases. Springer"},{"key":"463_CR19","doi-asserted-by":"crossref","unstructured":"Luong B, Ruggieri S, Turini F (2011) k-nn as an implementation of situation testing for discrimination discovery and prevention. Technical Report TR-11-04, Dipartimento di Informatica, Universita di Pisa","DOI":"10.1145\/2020408.2020488"},{"key":"463_CR20","unstructured":"Margineantu D, Dietterich T (1999) Learning decision trees for loss minimization in multi-class problems. Technical report. Department of Computer Science, Oregon State University"},{"key":"463_CR21","doi-asserted-by":"crossref","unstructured":"Pedreschi D, Ruggieri S, Turini F (2008) Discrimination-aware data mining. In: Proceedings of ACM SIGKDD conference on knowledge discovery and data mining","DOI":"10.1145\/1401890.1401959"},{"key":"463_CR22","doi-asserted-by":"crossref","unstructured":"Pedreschi D, Ruggieri S, Turini F (2009) Measuring discrimination in socially-sensitive decision records. In: Proceedings of SIAM conference on data mining","DOI":"10.1137\/1.9781611972795.50"},{"key":"463_CR23","doi-asserted-by":"crossref","unstructured":"Ruggieri S, Pedreschi D, Turini F (2010a) Dcube: discrimination discovery in databases. In: Proceedings of ACM SIGMOD international conference on management of data, pp 1127\u20131130","DOI":"10.1145\/1807167.1807298"},{"key":"463_CR24","doi-asserted-by":"crossref","unstructured":"Ruggieri S, Pedreschi D, Turini F (2010b) Integrating induction and deduction for finding evidence of discrimination. Artif Intell Law, 1\u201343","DOI":"10.1007\/s10506-010-9089-5"},{"key":"463_CR25","unstructured":"The European Court of Justice E (2011) The European court of justice ruling. via. http:\/\/ec.europa.eu\/ireland\/press_office\/news_of_the_day\/ecj-ruling-sex-discrimination-in-insurance-contracts_en.htm"},{"key":"463_CR26","unstructured":"The US department of Justice U (2011) The us federal legislation. via. http:\/\/www.justice.gov\/crt"},{"key":"463_CR27","doi-asserted-by":"crossref","unstructured":"Turner M, Skidmore F (1999) Mortgage lending discrimination: a review of existing evidence. Urban Institute Monograph Series on Race and Discrimination. Urban Institute Press","DOI":"10.1037\/e721552011-001"},{"key":"463_CR28","unstructured":"Turney P (2000) Cost-sensitive learning bibliography. Institute for Information Technology, National Research Council, Ottawa"},{"key":"463_CR29","unstructured":"US Department of Justice U (1974) Us equal credit opportunity act. via. http:\/\/www.fdic.gov\/regulations\/laws\/rules\/6500-1200.html"},{"key":"463_CR30","unstructured":"US Empl. Opp. Comm. E (1963) Us equal pay act. via. http:\/\/www.eeoc.gov\/laws\/statutes\/epa.cfm"},{"key":"463_CR31","unstructured":"Wang B, Japkowicz N (2009) Boosting support vector machines for imbalanced data Sets. Knowl Inf Syst, 1\u201320"},{"key":"463_CR32","doi-asserted-by":"crossref","unstructured":"Wang H, Wang S (2010) Mining incomplete survey data through classification. Knowl Inf Syst, 1\u201313","DOI":"10.1007\/s10115-009-0198-y"}],"container-title":["Knowledge and Information Systems"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10115-011-0463-8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,6,20]],"date-time":"2019-06-20T06:51:18Z","timestamp":1561013478000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10115-011-0463-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011,12,3]]},"references-count":32,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2012,10]]}},"alternative-id":["463"],"URL":"https:\/\/doi.org\/10.1007\/s10115-011-0463-8","relation":{},"ISSN":["0219-1377","0219-3116"],"issn-type":[{"value":"0219-1377","type":"print"},{"value":"0219-3116","type":"electronic"}],"subject":[],"published":{"date-parts":[[2011,12,3]]}}}