{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T19:39:12Z","timestamp":1740166752599,"version":"3.37.3"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2019,4,4]],"date-time":"2019-04-04T00:00:00Z","timestamp":1554336000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Netw Model Anal Health Inform Bioinforma"],"published-print":{"date-parts":[[2019,12]]},"DOI":"10.1007\/s13721-019-0186-4","type":"journal-article","created":{"date-parts":[[2019,4,5]],"date-time":"2019-04-05T13:47:01Z","timestamp":1554472021000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Melanoma risk modeling from limited positive samples"],"prefix":"10.1007","volume":"8","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3269-867X","authenticated-orcid":false,"given":"Aaron N.","family":"Richter","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Taghi M.","family":"Khoshgoftaar","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2019,4,4]]},"reference":[{"key":"186_CR1","unstructured":"American Cancer Society (2019) Cancer facts and figures 2019. \nhttps:\/\/www.cancer.org\/cancer\/melanoma-skin-cancer\/about\/key-statistics.html"},{"issue":"1","key":"186_CR2","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L (2001) Random forests. Mach Learn 45(1):5\u201332","journal-title":"Mach Learn"},{"key":"186_CR3","doi-asserted-by":"publisher","unstructured":"Chen T, Guestrin C (2016) XGBoost: a scalable tree boosting system. In: Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp 785\u2013794. \nhttps:\/\/doi.org\/10.1145\/2939672.2939785","DOI":"10.1145\/2939672.2939785"},{"issue":"2","key":"186_CR4","doi-asserted-by":"publisher","first-page":"105","DOI":"10.1007\/s40747-017-0037-9","volume":"3","author":"A Fern\u00e1ndez","year":"2017","unstructured":"Fern\u00e1ndez A, del R\u00edo S, Chawla NV, Herrera F (2017) An insight into imbalanced big data classification: outcomes and challenges. Complex Intell Syst 3(2):105\u2013120. \nhttps:\/\/doi.org\/10.1007\/s40747-017-0037-9","journal-title":"Complex Intell Syst"},{"issue":"1","key":"186_CR5","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1214\/009053604000001048","volume":"33","author":"Andrew Gelman","year":"2005","unstructured":"Gelman A (2005) Analysis of variance: why it is more important than ever. Ann Stat 33(1):1\u201331. \nhttp:\/\/www.jstor.org\/stable\/3448650","journal-title":"The Annals of Statistics"},{"key":"186_CR6","doi-asserted-by":"publisher","DOI":"10.1002\/9781118548387","volume-title":"Applied logistic regression","author":"DW Hosmer Jr","year":"2013","unstructured":"Hosmer DW Jr, Lemeshow S, Sturdivant RX (2013) Applied logistic regression, vol 398. Wiley, New York"},{"issue":"1","key":"186_CR7","doi-asserted-by":"publisher","first-page":"45","DOI":"10.1016\/S0933-3657(02)00086-6","volume":"27","author":"JM Jerez-Aragon\u00e9s","year":"2003","unstructured":"Jerez-Aragon\u00e9s JM, G\u00f3mez-Ruiz JA, Ramos-Jim\u00e9nez G, Mu\u00f1oz-P\u00e9rez J, Alba-Conejo E (2003) A combined neural network and decision trees model for prognosis of breast cancer relapse. Artif. Intell Med 27(1):45\u201363","journal-title":"Artif. Intell Med"},{"key":"186_CR8","unstructured":"Jones E, Oliphant T, Peterson P et al\u00a0(2001) SciPy: Open source scientific tools for Python. \nhttp:\/\/www.scipy.org\/"},{"issue":"1","key":"186_CR9","first-page":"25","volume":"30","author":"S Kotsiantis","year":"2006","unstructured":"Kotsiantis S, Kanellopoulos D, Pintelas P et al (2006) Handling imbalanced datasets: a review. GESTS Int Trans Comput Sci Eng 30(1):25\u201336","journal-title":"GESTS Int Trans Comput Sci Eng"},{"key":"186_CR10","unstructured":"Lema\u00eetre G, Nogueira F, Aridas CK (2017) Imbalanced-learn: a python toolbox to tackle the curse of imbalanced datasets in machine learning. J Mach Learn Res 18(17):1\u20135. \nhttp:\/\/jmlr.org\/papers\/v18\/16-365"},{"key":"186_CR11","unstructured":"National Cancer Institute (2018) Cancer statistics. \nhttps:\/\/www.cancer.gov\/about-cancer\/understanding\/statistics"},{"issue":"2","key":"186_CR12","doi-asserted-by":"publisher","first-page":"e54,823","DOI":"10.1371\/journal.pone.0054823","volume":"8","author":"S Park","year":"2013","unstructured":"Park S, Nam BH, Yang HR, Lee JA, Lim H, Han JT, Park IS, Shin HR, Lee JS (2013) Individualized risk prediction model for lung cancer in korean men. PLoS One 8(2):e54,823. \nhttps:\/\/doi.org\/10.1371\/journal.pone.0054823","journal-title":"PLoS One"},{"key":"186_CR13","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa F, Varoquaux G, Gramfort A, Michel V, Thirion B, Grisel O, Blondel M, Prettenhofer P, Weiss R, Dubourg V, Vanderplas J, Passos A, Cournapeau D, Brucher M, Perrot M, Duchesnay E (2011) Scikit-learn: machine learning in Python. J Mach Learn Res 12:2825\u20132830","journal-title":"J Mach Learn Res"},{"key":"186_CR14","first-page":"61","volume-title":"Advances in large margin classifiers","author":"JC Platt","year":"1999","unstructured":"Platt JC (1999) Probabilistic outputs for support vector machines and comparisons to regularized likelihood methods. In: Smola AJ,\u00a0Bartlett PJ (eds) Advances in large margin classifiers. MIT Press, Cambridge, pp 61\u201374"},{"key":"186_CR15","doi-asserted-by":"publisher","first-page":"77","DOI":"10.1613\/jair.279","volume":"4","author":"J. R. Quinlan","year":"1996","unstructured":"Quinlan JR (1996) Improved use of continuous attributes in C4.5. J Artif Intell Res 4:77\u201390","journal-title":"Journal of Artificial Intelligence Research"},{"issue":"5","key":"186_CR16","doi-asserted-by":"publisher","first-page":"958","DOI":"10.1002\/cncr.20065","volume":"100","author":"M Radespiel-Tr\u00f6ger","year":"2004","unstructured":"Radespiel-Tr\u00f6ger M, Hohenberger W, Reingruber B (2004) Improved prediction of recurrence after curative resection of colon carcinoma using tree-based risk stratification. Cancer 100(5):958\u2013967. \nhttps:\/\/doi.org\/10.1002\/cncr.20065","journal-title":"Cancer"},{"key":"186_CR17","unstructured":"Rennie JD, Shih L, Teevan J, Karger DR (2003) Tackling the poor assumptions of naive bayes text classifiers. In: Proceedings of the 20th international conference on machine learning (ICML-03), pp 616\u2013623"},{"key":"186_CR18","unstructured":"Richter AN, Khoshgoftaar TM (2017) Modernizing analytics for melanoma with a large-scale research dataset. In: IEEE 18th International Conference on Information Reuse and Integration (IRI), 2017"},{"key":"186_CR19","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.artmed.2018.06.002","volume":"90","author":"Aaron N. Richter","year":"2018","unstructured":"Richter AN, Khoshgoftaar TM (2018) A review of statistical and machine learning methods for modeling cancer risk using structured clinical data. Artif Intell Med. \nhttps:\/\/doi.org\/10.1016\/j.artmed.2018.06.002","journal-title":"Artificial Intelligence in Medicine"},{"key":"186_CR20","doi-asserted-by":"publisher","unstructured":"Seiffert C, Khoshgoftaar TM, Hulse JV, Napolitano A (2007) Mining data with rare events: a case study. In: Proceedings of the 19th IEEE international conference on tools with artificial intelligence, vol 2, IEEE Computer Society, Washington, DC, USA, ICTAI \u201907, pp 132\u2013139. \nhttps:\/\/doi.org\/10.1109\/ICTAI.2007.130","DOI":"10.1109\/ICTAI.2007.130"},{"key":"186_CR21","doi-asserted-by":"crossref","unstructured":"Seiffert C, Khoshgoftaar TM, Van Hulse J, Napolitano A (2008) A comparative study of data sampling and cost sensitive learning. In: IEEE International Conference on Data Mining Workshops, pp 46\u201352","DOI":"10.1109\/ICDMW.2008.119"},{"issue":"12","key":"186_CR22","doi-asserted-by":"publisher","first-page":"3358","DOI":"10.1016\/j.patcog.2007.04.009","volume":"40","author":"Y Sun","year":"2007","unstructured":"Sun Y, Kamel MS, Wong AK, Wang Y (2007) Cost-sensitive boosting for classification of imbalanced data. Pattern Recogn 40(12):3358\u20133378","journal-title":"Pattern Recogn"},{"key":"186_CR23","doi-asserted-by":"publisher","first-page":"69","DOI":"10.1016\/j.knosys.2015.05.027","volume":"87","author":"Isaac Triguero","year":"2015","unstructured":"Triguero I, del R\u00edo S, L\u00f3pez V, Bacardit J, Ben\u00edtez JM, Herrera F (2015) ROSEFW-RF: The winner algorithm for the ECBDL\u201914 big data competition: an extremely imbalanced big data bioinformatics problem. Knowledge-Based Syst 87:69\u201379. \nhttps:\/\/doi.org\/10.1016\/j.knosys.2015.05.027\n\n. \nhttp:\/\/www.sciencedirect.com\/science\/article\/pii\/S0950705115002130","journal-title":"Knowledge-Based Systems"},{"key":"186_CR24","doi-asserted-by":"publisher","first-page":"99","DOI":"10.2307\/3001913","volume":"5","author":"JW Tukey","year":"1949","unstructured":"Tukey JW (1949) Comparing individual means in the analysis of variance. Biometrics 5:99\u2013114","journal-title":"Biometrics"},{"key":"186_CR25","unstructured":"US Census Bureau (2018) US and World Population Clock. \nhttps:\/\/www.census.gov\/popclock\/"},{"issue":"8","key":"186_CR26","doi-asserted-by":"publisher","first-page":"1450","DOI":"10.1158\/1055-9965.EPI-14-0295","volume":"23","author":"J. A. Usher-Smith","year":"2014","unstructured":"Usher-Smith JA, Emery J, Kassianos AP, Walter FM (2014) Risk prediction models for melanoma: a systematic review. Cancer Epidemiol Biomark Prev 23(8):1450\u20131463. \nhttps:\/\/doi.org\/10.1158\/1055-9965.EPI-14-0295\n\n. \nhttp:\/\/cebp.aacrjournals.org\/cgi\/doi\/10.1158\/1055-9965.EPI-14-0295","journal-title":"Cancer Epidemiology Biomarkers & Prevention"},{"key":"186_CR27","doi-asserted-by":"crossref","unstructured":"Van Hulse J, Khoshgoftaar TM, Napolitano A (2007) Experimental perspectives on learning from imbalanced data. In: Proceedings of the 24th International Conference on Machine Learning, ACM, pp 935\u2013942","DOI":"10.1145\/1273496.1273614"},{"issue":"2","key":"186_CR28","doi-asserted-by":"publisher","first-page":"22","DOI":"10.1109\/MCSE.2011.37","volume":"13","author":"S Walt van der","year":"2011","unstructured":"van der Walt S, Colbert SC, Varoquaux G (2011) The numpy array: a structure for efficient numerical computation. Comput Sci Eng 13(2):22\u201330. \nhttps:\/\/doi.org\/10.1109\/MCSE.2011.37","journal-title":"Comput Sci Eng"},{"issue":"1","key":"186_CR29","doi-asserted-by":"publisher","first-page":"e0146,473","DOI":"10.1371\/journal.pone.0146473","volume":"11","author":"A Yu","year":"2016","unstructured":"Yu A, Woo SM, Joo J, Yang HR, Lee WJ, Park SJ, Nam BH (2016) Development and validation of a prediction model to estimate individual risk of pancreatic cancer. PLoS One 11(1):e0146,473. \nhttps:\/\/doi.org\/10.1371\/journal.pone.0146473","journal-title":"PLoS One"},{"issue":"11","key":"186_CR30","doi-asserted-by":"publisher","first-page":"56","DOI":"10.1145\/2934664","volume":"59","author":"M Zaharia","year":"2016","unstructured":"Zaharia M, Xin RS, Wendell P, Das T, Armbrust M, Dave A, Meng X, Rosen J, Venkataraman S, Franklin MJ et al (2016) Apache Spark: a unified engine for big data processing. Commun ACM 59(11):56\u201365","journal-title":"Commun ACM"}],"container-title":["Network Modeling Analysis in Health Informatics and Bioinformatics"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s13721-019-0186-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s13721-019-0186-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s13721-019-0186-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,4,2]],"date-time":"2020-04-02T23:20:36Z","timestamp":1585869636000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s13721-019-0186-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,4,4]]},"references-count":30,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2019,12]]}},"alternative-id":["186"],"URL":"https:\/\/doi.org\/10.1007\/s13721-019-0186-4","relation":{},"ISSN":["2192-6662","2192-6670"],"issn-type":[{"type":"print","value":"2192-6662"},{"type":"electronic","value":"2192-6670"}],"subject":[],"published":{"date-parts":[[2019,4,4]]},"assertion":[{"value":"17 January 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"24 March 2019","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 March 2019","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 April 2019","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance with ethical standards"}},{"value":"The authors declare that they have no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"7"}}