{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,11]],"date-time":"2026-06-11T16:58:35Z","timestamp":1781197115492,"version":"3.54.1"},"publisher-location":"Cham","reference-count":34,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783319463063","type":"print"},{"value":"9783319463070","type":"electronic"}],"license":[{"start":{"date-parts":[[2016,1,1]],"date-time":"2016-01-01T00:00:00Z","timestamp":1451606400000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016]]},"DOI":"10.1007\/978-3-319-46307-0_21","type":"book-chapter","created":{"date-parts":[[2016,9,20]],"date-time":"2016-09-20T07:47:42Z","timestamp":1474357662000},"page":"325-340","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":10,"title":["On Selection Bias with Imbalanced Classes"],"prefix":"10.1007","author":[{"given":"Gert","family":"Jacobusse","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Cor","family":"Veenman","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2016,9,21]]},"reference":[{"issue":"7","key":"21_CR1","doi-asserted-by":"publisher","first-page":"1145","DOI":"10.1016\/S0031-3203(96)00142-2","volume":"30","author":"A Bradley","year":"1997","unstructured":"Bradley, A.: The use of the area under the ROC curve in the evaluation of machine learning algorithms. Pattern Recogn. 30(7), 1145\u20131159 (1997)","journal-title":"Pattern Recogn."},{"issue":"1","key":"21_CR2","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman, L.: Random forests. Mach. Learn. 45(1), 5\u201332 (2001)","journal-title":"Mach. Learn."},{"key":"21_CR3","doi-asserted-by":"crossref","unstructured":"Chapelle, O., Sch\u00f6lkopf, B., Zien, A.: Semi-supervised Learning (2006)","DOI":"10.7551\/mitpress\/9780262033589.001.0001"},{"key":"21_CR4","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"465","DOI":"10.1007\/978-3-642-34487-9_56","volume-title":"Neural Information Processing","author":"S Chaudhari","year":"2012","unstructured":"Chaudhari, S., Shevade, S.: Learning from positive and unlabelled examples using maximum margin clustering. In: Huang, T., Zeng, Z., Li, C., Leung, C.S. (eds.) ICONIP 2012. LNCS, vol. 7665, pp. 465\u2013473. Springer, Heidelberg (2012). doi:10.1007\/978-3-642-34487-9_56"},{"key":"21_CR5","unstructured":"Chen, C., Liaw, A., Breiman, L.: Using Random Forest to Learn Imbalanced Data. Technical report, Department of Statistics, University of Berkeley (2004)"},{"key":"21_CR6","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1007\/978-3-540-87987-9_8","volume-title":"Algorithmic Learning Theory","author":"C Cortes","year":"2008","unstructured":"Cortes, C., Mohri, M., Riley, M., Rostamizadeh, A.: Sample selection bias correction theory. In: Freund, Y., Gy\u00f6rfi, L., Tur\u00e1n, G., Zeugmann, T. (eds.) ALT 2008. LNCS (LNAI), vol. 5254, pp. 38\u201353. Springer, Heidelberg (2008). doi:10.1007\/978-3-540-87987-9_8"},{"key":"21_CR7","volume-title":"Pattern Classification","author":"R Duda","year":"2001","unstructured":"Duda, R., Hart, P., Stork, D.: Pattern Classification. John Wiley and Sons Inc., New York (2001)"},{"key":"21_CR8","unstructured":"Elkan, C.: The foundations of cost-sensitive learning. In: Proceedings of the 17th International Joint Conference on Artificial Intelligence, IJCAI 2001, vol. 2, pp. 973\u2013978 (2001)"},{"key":"21_CR9","doi-asserted-by":"crossref","unstructured":"Elkan, C., Noto, K.: Learning classifiers from only positive and unlabeled data. In: Proceedings of the 14th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD 2008, pp. 213\u2013220. ACM, New York (2008)","DOI":"10.1145\/1401890.1401920"},{"key":"21_CR10","first-page":"1871","volume":"9","author":"RE Fan","year":"2008","unstructured":"Fan, R.E., Chang, K.W., Hsieh, C.J., Wang, X.R., Lin, C.J.: LIBLINEAR: a library for large linear classification. J. Mach. Learn. Res. 9, 1871\u20131874 (2008)","journal-title":"J. Mach. Learn. Res."},{"key":"21_CR11","doi-asserted-by":"publisher","first-page":"291","DOI":"10.1023\/A:1009700419189","volume":"1","author":"T Fawcett","year":"1997","unstructured":"Fawcett, T., Provost, F.: Adaptive fraud detection. Data Min. Knowl. Disc. 1, 291\u2013316 (1997)","journal-title":"Data Min. Knowl. Disc."},{"key":"21_CR12","doi-asserted-by":"crossref","unstructured":"Friedman, J.H.: Greedy function approximation: a gradient boosting machine (2000)","DOI":"10.1214\/aos\/1013203451"},{"key":"21_CR13","doi-asserted-by":"crossref","unstructured":"Guo, X., Yin, Y., Dong, C., Yang, G., Zhou, G.: On the class imbalance problem. In: 2008 Fourth International Conference on Natural Computation, ICNC 2008, vol. 4, pp. 192\u2013201. IEEE (2008)","DOI":"10.1109\/ICNC.2008.871"},{"issue":"9","key":"21_CR14","doi-asserted-by":"publisher","first-page":"1263","DOI":"10.1109\/TKDE.2008.239","volume":"21","author":"H He","year":"2009","unstructured":"He, H., Garcia, E.: Learning from imbalanced data. IEEE Trans. Knowl. Data Eng. 21(9), 1263\u20131284 (2009)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"issue":"4","key":"21_CR15","doi-asserted-by":"publisher","first-page":"493","DOI":"10.1007\/s11280-013-0215-7","volume":"17","author":"H Hu","year":"2014","unstructured":"Hu, H., Sha, C., Wang, X., Zhou, A.: A unified framework for semi-supervised PU learning. World Wide Web 17(4), 493\u2013510 (2014)","journal-title":"World Wide Web"},{"key":"21_CR16","doi-asserted-by":"crossref","unstructured":"Huang, J., Smola, A., Gretton, A., Borgwardt, K., Scholkopf, B.: Correcting sample selection bias by unlabeled data. In: Advances in Neural Information Processing Systems, vol. 19, p. 601 (2007)","DOI":"10.7551\/mitpress\/7503.003.0080"},{"issue":"5","key":"21_CR17","doi-asserted-by":"crossref","first-page":"429","DOI":"10.3233\/IDA-2002-6504","volume":"6","author":"N Japkowicz","year":"2002","unstructured":"Japkowicz, N., Stephen, S.: The class imbalance problem: a systematic study. Intell. Data Anal. 6(5), 429\u2013449 (2002)","journal-title":"Intell. Data Anal."},{"key":"21_CR18","unstructured":"Kubat, M., Matwin, S.: Addressing the curse of imbalanced training sets: one-sided selection. In: Proceedings of the Fourteenth International Conference on Machine Learning (ICML), pp. 179\u2013186. Morgan Kaufmann (1997)"},{"key":"21_CR19","doi-asserted-by":"crossref","unstructured":"Li, H., Chen, Z., Liu, B., Wei, X., Shao, J.: Spotting fake reviews via collective positive-unlabeled learning. In: IEEE International Conference on Data Mining (ICDM 2014) (2014)","DOI":"10.1109\/ICDM.2014.47"},{"issue":"24","key":"21_CR20","doi-asserted-by":"publisher","first-page":"3310","DOI":"10.1093\/bioinformatics\/btp589","volume":"25","author":"Q Li","year":"2009","unstructured":"Li, Q., Wang, Y., Bryant, S.: A novel method for mining highly imbalanced high-throughput screening data in PubChem. Bioinformatics 25(24), 3310\u20133316 (2009)","journal-title":"Bioinformatics"},{"key":"21_CR21","doi-asserted-by":"publisher","DOI":"10.1002\/9781119013563","volume-title":"Statistical Analysis with Missing Data","author":"RJA Little","year":"2002","unstructured":"Little, R.J.A., Rubin, D.B.: Statistical Analysis with Missing Data. Wiley, New York (2002)"},{"key":"21_CR22","unstructured":"Liu, A., Ziebart, B.: Robust classification under sample selection bias. In: Advances in Neural Information Processing Systems 27: Annual Conference on Neural Information Processing Systems 2014, Montreal, Quebec, Canada, 8\u201313 December 2014, pp. 37\u201345 (2014)"},{"key":"21_CR23","doi-asserted-by":"crossref","first-page":"141","DOI":"10.1016\/j.neunet.2011.07.002","volume":"25","author":"Jordan M. Malof","year":"2012","unstructured":"Malof, J., Mazurowski, M., Tourassib, G.: The effect of class imbalance on case selection for case-based classifiers: an empirical study in the context of medical decision support. Neural Netw. 25(1), January 2012","journal-title":"Neural Networks"},{"key":"21_CR24","unstructured":"Mansour, Y., Mohri, M., Rostamizadeh, A.: Domain adaptation: learning bounds and algorithms. CoRR"},{"key":"21_CR25","unstructured":"du\u00a0Plessis, M., Niu, G., Sugiyama, M.: Analysis of learning from positive andunlabeled data. In: Advances in Neural Information Processing Systems 27: Annual Conference on Neural Information Processing Systems, Montreal, Quebec, Canada, 8\u201313 December 2014, pp. 703\u2013711 (2014)"},{"issue":"2","key":"21_CR26","doi-asserted-by":"publisher","first-page":"147","DOI":"10.1023\/A:1010968702992","volume":"45","author":"M Ramoni","year":"2001","unstructured":"Ramoni, M., Sebastiani, P.: Robust learning with missing data. Mach. Learn. 45(2), 147\u2013170 (2001)","journal-title":"Mach. Learn."},{"issue":"2","key":"21_CR27","doi-asserted-by":"publisher","first-page":"227","DOI":"10.1016\/S0378-3758(00)00115-4","volume":"90","author":"H Shimodaira","year":"2000","unstructured":"Shimodaira, H.: Improving predictive inference under covariate shift by weighting the log-likelihood function. J. Stat. Plann. Infer. 90(2), 227\u2013244 (2000)","journal-title":"J. Stat. Plann. Infer."},{"key":"21_CR28","doi-asserted-by":"crossref","unstructured":"Van\u00a0Vlasselaer, V., Akoglu, L., Eliassi-Rad, T., Snoeck, M., Baesens, B.: Guilt-by-constellation: fraud detection by suspicious clique memberships. In: 2015 48th Hawaii International Conference on System Sciences (HICSS), pp. 918\u2013927. IEEE, January 2015","DOI":"10.1109\/HICSS.2015.114"},{"key":"21_CR29","doi-asserted-by":"crossref","unstructured":"Varshney, K., Chenthamarakshan, V., Fancher, S., Wang, J., Fang, D., Mojsilovi\u0107, A.: Predicting employee expertise for talent management in the enterprise. In: Proceedings of the 20th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, KDD 2014, pp. 1729\u20131738. ACM, New York (2014)","DOI":"10.1145\/2623330.2623337"},{"key":"21_CR30","doi-asserted-by":"crossref","unstructured":"Veenman, C.: Data base investigation as a ranking problem. In: Proceedings of the European Intelligence and Security Informatics Conference (EISIC), Odense, Denmark, 21\u201324 August 2012","DOI":"10.1109\/EISIC.2012.44"},{"key":"21_CR31","unstructured":"Visa, S., Ralescu, A.: Issues in mining imbalanced data sets - a review paper. In: Proceedings of the Sixteen Midwest Artificial Intelligence and Cognitive Science Conference, pp. 67\u201373 (2005)"},{"key":"21_CR32","doi-asserted-by":"crossref","unstructured":"Zadrozny, B.: Learning and evaluating classifiers under sample selection bias. In: Proceedings of the Twenty-First International Conference on Machine Learning, ICML 2004, p. 114. ACM, New York (2004)","DOI":"10.1145\/1015330.1015425"},{"key":"21_CR33","unstructured":"Zhou, J., Pan, S., Mao, Q., Tsang, I.: Multi-view positive and unlabeled learning. In: Proceedings of the 4th Asian Conference on Machine Learning, ACML 2012, Singapore, Singapore, 4\u20136 November 2012, pp. 555\u2013570 (2012)"},{"key":"21_CR34","unstructured":"Zhu, X.: Semi-supervised learning literature survey. Technical report (2006)"}],"container-title":["Lecture Notes in Computer Science","Discovery Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-46307-0_21","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,12]],"date-time":"2024-03-12T12:08:32Z","timestamp":1710245312000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-46307-0_21"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016]]},"ISBN":["9783319463063","9783319463070"],"references-count":34,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-46307-0_21","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016]]},"assertion":[{"value":"21 September 2016","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"DS","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Discovery Science","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Bari","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2016","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19 October 2016","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21 October 2016","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"dis2016","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}