{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,7]],"date-time":"2026-04-07T07:20:34Z","timestamp":1775546434681,"version":"3.50.1"},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2020,8,16]],"date-time":"2020-08-16T00:00:00Z","timestamp":1597536000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,8,16]],"date-time":"2020-08-16T00:00:00Z","timestamp":1597536000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Mach Learn"],"published-print":{"date-parts":[[2021,1]]},"DOI":"10.1007\/s10994-020-05896-2","type":"journal-article","created":{"date-parts":[[2020,8,16]],"date-time":"2020-08-16T19:02:25Z","timestamp":1597604545000},"page":"89-138","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":87,"title":["Interpretable clustering: an optimization approach"],"prefix":"10.1007","volume":"110","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-1985-1003","authenticated-orcid":false,"given":"Dimitris","family":"Bertsimas","sequence":"first","affiliation":[]},{"given":"Agni","family":"Orfanoudaki","sequence":"additional","affiliation":[]},{"given":"Holly","family":"Wiberg","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,8,16]]},"reference":[{"key":"5896_CR1","unstructured":"Arthur, D., & Vassilvitskii, S. (2007). k-means++: The advantages of careful seeding. In Proceedings of the 18th annual ACM-SIAM symposium on Discrete algorithms (pp 1027\u20131035). 
Society for Industrial and Applied Mathematics."},{"key":"5896_CR2","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1109\/TKDE.2005.11","volume":"17","author":"J Basak","year":"2005","unstructured":"Basak, J., & Krishnapuram, R. (2005). Interpretable hierarchical clustering by constructing an unsupervised decision tree. IEEE Transactions on Knowledge and Data Engineering, 17, 121\u2013132. https:\/\/doi.org\/10.1109\/TKDE.2005.11.","journal-title":"IEEE Transactions on Knowledge and Data Engineering"},{"issue":"7","key":"5896_CR3","doi-asserted-by":"publisher","first-page":"1039","DOI":"10.1007\/s10994-017-5633-9","volume":"106","author":"D Bertsimas","year":"2017","unstructured":"Bertsimas, D., & Dunn, J. (2017). Optimal classification trees. Machine Learning, 106(7), 1039\u20131082.","journal-title":"Machine Learning"},{"key":"5896_CR4","volume-title":"Machine Learning under a Modern Optimization Lens","author":"D Bertsimas","year":"2019","unstructured":"Bertsimas, D., & Dunn, J. (2019). Machine Learning under a Modern Optimization Lens. Waltham: Dynamic Ideas Press."},{"key":"5896_CR5","volume-title":"The Analytics Edge","author":"D Bertsimas","year":"2016","unstructured":"Bertsimas, D., O\u2019Hair, A. K., & Pulleyblank, W. R. (2016). The Analytics Edge. Waltham: Dynamic Ideas Press."},{"key":"5896_CR6","unstructured":"Bezanson, J., Karpinski, S., Shah, V.B., & Edelman, A. (2012). Julia: A fast dynamic language for technical computing. arXiv preprint.\u00a0arXiv:1209.5145."},{"key":"5896_CR7","unstructured":"Blockeel, H., De\u00a0Raedt, L., & Ramon, J. (2000) Top-down induction of clustering trees. arXiv preprint.\u00a0arXiv:cs\/0011032."},{"key":"5896_CR8","volume-title":"Classification and regression trees","author":"L Breiman","year":"1984","unstructured":"Breiman, L., Friedman, J., Stone, C. J., & Olshen, R. A. (1984). Classification and regression trees. 
Boca Raton: CRC Press."},{"issue":"4","key":"5896_CR9","first-page":"87","volume":"47","author":"M Chavent","year":"1999","unstructured":"Chavent, M., Guinot, C., Lechevallier, Y., & Tenenhaus, M. (1999). M\u00e9thodes divisives de classification et segmentation non supervis\u00e9e : recherche d\u2019une typologie de la peau humaine saine. Revue de Statistique Appliqu\u00e9e, 47(4), 87\u201399.","journal-title":"Revue de Statistique Appliqu\u00e9e"},{"key":"5896_CR10","volume-title":"A change of heart: Unraveling the mysteries of cardiovascular disease","author":"SB Daniel Levy","year":"2006","unstructured":"Daniel Levy, S. B. (2006). A change of heart: Unraveling the mysteries of cardiovascular disease. New York: Vintage."},{"key":"5896_CR11","doi-asserted-by":"publisher","unstructured":"Diday, E., & Simon, J. C. (1976). Clustering analysis (pp. 47\u201394). Berlin: Springer. https:\/\/doi.org\/10.1007\/978-3-642-96303-2_3.","DOI":"10.1007\/978-3-642-96303-2_3"},{"key":"5896_CR12","unstructured":"Doshi-Velez, F., & Kim, B. (2017). Towards a rigorous science of interpretable machine learning.\u00a0arXiv preprint. arXiv:1702.08608."},{"issue":"1","key":"5896_CR13","doi-asserted-by":"publisher","first-page":"95","DOI":"10.1080\/01969727408546059","volume":"4","author":"JC Dunn","year":"1974","unstructured":"Dunn, J. C. (1974). Well-separated clusters and optimal fuzzy partitions. Journal of Cybernetics, 4(1), 95\u2013104. https:\/\/doi.org\/10.1080\/01969727408546059.","journal-title":"Journal of Cybernetics"},{"key":"5896_CR14","unstructured":"Dunn, J. W. (2018). Optimal trees for prediction and prescription. PhD thesis, Massachusetts Institute of Technology."},{"key":"5896_CR15","first-page":"100","volume-title":"Cluster analysis","author":"B Duran","year":"1974","unstructured":"Duran, B., & Odell, P. (1974). Cluster analysis (1st ed., p. 100). 
Berlin: Springer.","edition":"1"},{"key":"5896_CR16","first-page":"226","volume":"96","author":"M Ester","year":"1996","unstructured":"Ester, M., Kriegel, H. P., Sander, J., Xu, X., et al. (1996). A density-based algorithm for discovering clusters in large spatial databases with noise. Kdd, 96, 226\u2013231.","journal-title":"Kdd"},{"issue":"20","key":"5896_CR17","doi-asserted-by":"publisher","first-page":"1605","DOI":"10.1001\/jama.1995.03520440059037","volume":"273","author":"J Everhart","year":"1995","unstructured":"Everhart, J., & Wright, D. (1995). Diabetes mellitus as a risk factor for pancreatic cancer: A meta-analysis. JAMA, 273(20), 1605\u20131609.","journal-title":"JAMA"},{"issue":"4","key":"5896_CR18","doi-asserted-by":"publisher","first-page":"518","DOI":"10.1016\/0091-7435(75)90037-7","volume":"4","author":"M Feinleib","year":"1975","unstructured":"Feinleib, M., Kannel, W., Garrison, R., McNamara, P., & Castelli, W. (1975). The framingham offspring study. Design and preliminary data. Preventive Medicine, 4(4), 518\u2013525. https:\/\/doi.org\/10.1016\/0091-7435(75)90037-7.","journal-title":"Preventive Medicine"},{"key":"5896_CR19","first-page":"768","volume":"21","author":"EW Forgy","year":"1965","unstructured":"Forgy, E. W. (1965). Cluster analysis of multivariate data: Efficiency versus interpretability of classifications. Biometrics, 21, 768\u2013769.","journal-title":"Biometrics"},{"issue":"2","key":"5896_CR20","doi-asserted-by":"publisher","first-page":"125","DOI":"10.1007\/s11634-013-0129-3","volume":"7","author":"R Fraiman","year":"2013","unstructured":"Fraiman, R., Ghattas, B., & Svarc, M. (2013). Interpretable clustering using unsupervised binary trees. Advances in Data Analysis and Classification, 7(2), 125\u2013145. https:\/\/doi.org\/10.1007\/s11634-013-0129-3. arXiv:1103.5339.","journal-title":"Advances in Data Analysis and Classification"},{"key":"5896_CR21","unstructured":"Goodman, B., & Flaxman, S. (2016). 
European union regulations on algorithmic decision-making and a \u201cright to explanation\u201d. arXiv preprint. arXiv:1606.08813."},{"issue":"1","key":"5896_CR22","doi-asserted-by":"publisher","first-page":"1","DOI":"10.18637\/jss.v091.i01","volume":"91","author":"M Hahsler","year":"2019","unstructured":"Hahsler, M., Piekenbrock, M., & Doran, D. (2019). dbscan: Fast density-based clustering with r. Journal of Statistical Software, 91(1), 1\u201330. https:\/\/doi.org\/10.18637\/jss.v091.i01.","journal-title":"Journal of Statistical Software"},{"issue":"2","key":"5896_CR23","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1023\/A:1012801612483","volume":"17","author":"M Halkidi","year":"2001","unstructured":"Halkidi, M., Batistakis, Y., & Vazirgiannis, M. (2001). On clustering validation techniques. Journal of Intelligent Information Systems, 17(2), 107\u2013145. https:\/\/doi.org\/10.1023\/A:1012801612483.","journal-title":"Journal of Intelligent Information Systems"},{"key":"5896_CR24","unstructured":"Hancock, T. P., Coomans, D. H., & Everingham, Y. L. (2003). Supervised Hierarchical Clustering Using CART. In Proceedings of MODSIM 2003 International Congress on Modelling and Simulation, Townsville, QLD, Australia (pp. 1880\u20131885)."},{"key":"5896_CR25","doi-asserted-by":"crossref","unstructured":"Hastie, T., Tibshirani, R., & Friedman, J. (2009). Unsupervised learning. In The elements of statistical learning (pp 485\u2013585). Springer.","DOI":"10.1007\/978-0-387-84858-7_14"},{"issue":"3","key":"5896_CR26","doi-asserted-by":"publisher","first-page":"264","DOI":"10.1145\/331499.331504","volume":"31","author":"AK Jain","year":"1999","unstructured":"Jain, A. K., Murty, M. N., & Flynn, P. J. (1999). Data clustering: A review. ACM Computing Surveys, 31(3), 264\u2013323. https:\/\/doi.org\/10.1145\/331499.331504.","journal-title":"ACM Computing Surveys"},{"key":"5896_CR27","doi-asserted-by":"crossref","unstructured":"Jolliffe, I. (2011). 
Principal component analysis. In International encyclopedia of statistical science (pp. 1094\u20131096). Springer.","DOI":"10.1007\/978-3-642-04898-2_455"},{"issue":"20","key":"5896_CR28","doi-asserted-by":"publisher","first-page":"1571","DOI":"10.1001\/jama.1996.03530440051036","volume":"275","author":"WB Kannel","year":"1996","unstructured":"Kannel, W. B. (1996). Blood pressure as a cardiovascular risk factor: Prevention and treatment. JAMA, 275(20), 1571\u20131576.","journal-title":"JAMA"},{"key":"5896_CR29","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781139523967","volume-title":"Geometric methods in signal and image analysis","author":"H Krim","year":"2015","unstructured":"Krim, H., & Hamza, A. B. (2015). Geometric methods in signal and image analysis. Cambridge: Cambridge University Press."},{"key":"5896_CR30","doi-asserted-by":"crossref","DOI":"10.1002\/9781118874059","volume-title":"Discovering knowledge in data: An introduction to data mining","author":"DT Larose","year":"2014","unstructured":"Larose, D. T., & Larose, C. D. (2014). Discovering knowledge in data: An introduction to data mining. Hoboken: Wiley."},{"key":"5896_CR31","doi-asserted-by":"crossref","unstructured":"Liu, B., Xia, Y., & Yu, P. S. (2000). Clustering through decision tree construction. In Proceedings of the ninth international conference on Information and knowledge management - CIKM \u201900, McLean, VA (pp. 20\u201329). https:\/\/doi.org\/10.1145\/354756.354775.\u00a0arXiv:1011.1669v3.","DOI":"10.1145\/354756.354775"},{"key":"5896_CR32","doi-asserted-by":"crossref","unstructured":"Liu, Y., Li, Z., Xiong, H., Gao, X., & Wu, J. (2010). Understanding of internal clustering validation measures. In IEEE 10th International Conference on Data Mining (ICDM), 2010 (pp 911\u2013916). IEEE.","DOI":"10.1109\/ICDM.2010.35"},{"key":"5896_CR33","unstructured":"MacQueen, J. (1967). Some methods for classification and analysis of multivariate observations. 
In Proceedings of the 5th Berkeley symposium on mathematical statistics and probability, volume 1: Statistics (pp. 281\u2013297). Berkeley, CA: University of California Press."},{"issue":"12","key":"5896_CR34","doi-asserted-by":"publisher","first-page":"1650","DOI":"10.1109\/TPAMI.2002.1114856","volume":"24","author":"U Maulik","year":"2002","unstructured":"Maulik, U., & Bandyopadhyay, S. (2002). Performance evaluation of some clustering algorithms and validity indices. IEEE Transactions on Pattern Analysis and Machine Intelligence, 24(12), 1650\u20131654.","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"5896_CR35","unstructured":"Mouselimis, L. (2019). ClusterR: Gaussian Mixture Models, K-Means, Mini-Batch-Kmeans, K-Medoids and Affinity Propagation Clustering. R package version, 1(2)."},{"issue":"9","key":"5896_CR36","doi-asserted-by":"publisher","first-page":"935","DOI":"10.1001\/archsurg.134.9.935","volume":"134","author":"PJ Offner","year":"1999","unstructured":"Offner, P. J., Moore, E. E., & Biffl, W. L. (1999). Male gender is a risk factor for major infections after surgery. Archives of Surgery, 134(9), 935\u2013940.","journal-title":"Archives of Surgery"},{"issue":"2","key":"5896_CR37","doi-asserted-by":"publisher","first-page":"70","DOI":"10.1145\/1233321.1233330","volume":"8","author":"G Piatetsky-Shapiro","year":"2006","unstructured":"Piatetsky-Shapiro, G., Djeraba, C., Getoor, L., Grossman, R., Feldman, R., & Zaki, M. (2006). What are the grand challenges for data mining?: Kdd-2006 panel report. ACM SIGKDD Explorations Newsletter, 8(2), 70\u201377.","journal-title":"ACM SIGKDD Explorations Newsletter"},{"issue":"6","key":"5896_CR38","doi-asserted-by":"publisher","first-page":"919","DOI":"10.1016\/j.ipm.2003.10.006","volume":"40","author":"DR Radev","year":"2004","unstructured":"Radev, D. R., Jing, H., Sty\u015b, M., & Tam, D. (2004). Centroid-based summarization of multiple documents. 
Information Processing and Management, 40(6), 919\u2013938. https:\/\/doi.org\/10.1016\/j.ipm.2003.10.006.","journal-title":"Information Processing and Management"},{"issue":"4","key":"5896_CR39","first-page":"329","volume":"26","author":"CR Rao","year":"1964","unstructured":"Rao, C. R. (1964). The use and interpretation of principal component analysis in applied research. Sankhy\u0101: The Indian Journal of Statistics, Series A (1961-2002), 26(4), 329\u2013358.","journal-title":"Sankhy\u0101: The Indian Journal of Statistics, Series A (1961-2002)"},{"key":"5896_CR40","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1016\/0377-0427(87)90125-7","volume":"20","author":"PJ Rousseeuw","year":"1987","unstructured":"Rousseeuw, P. J. (1987). Silhouettes: A graphical aid to the interpretation and validation of cluster analysis. Journal of Computational and Applied Mathematics, 20, 53\u201365.","journal-title":"Journal of Computational and Applied Mathematics"},{"key":"5896_CR41","doi-asserted-by":"crossref","unstructured":"Ruspini, E. H. (1970). Numerical methods for fuzzy clustering.\u00a0Information Sciences,\u00a02(3),\u00a0319\u2013350.","DOI":"10.1016\/S0020-0255(70)80056-1"},{"key":"5896_CR42","unstructured":"Sneath, P. H., Sokal, R. R., et al. (1973). Numerical taxonomy. The Principles and Practice of Numerical Classification."},{"issue":"1","key":"5896_CR43","doi-asserted-by":"publisher","first-page":"43","DOI":"10.1016\/0004-3702(86)90030-5","volume":"28","author":"RE Stepp","year":"1986","unstructured":"Stepp, R. E., & Michalski, R. S. (1986). Conceptual clustering of structured objects: A goal-oriented approach. Artificial Intelligence, 28(1), 43\u201369.","journal-title":"Artificial Intelligence"},{"key":"5896_CR44","unstructured":"Ultsch, A. (2005). Fundamental clustering problems suite (FCPS). 
Technical report, University of Marburg."},{"issue":"7","key":"5896_CR45","doi-asserted-by":"publisher","first-page":"1025","DOI":"10.1001\/jama.1988.03720070025028","volume":"259","author":"PA Wolf","year":"1988","unstructured":"Wolf, P. A., D\u2019Agostino, R. B., Kannel, W. B., Bonita, R., & Belanger, A. J. (1988). Cigarette smoking as a risk factor for stroke: The framingham study. JAMA, 259(7), 1025\u20131029.","journal-title":"JAMA"},{"key":"5896_CR46","doi-asserted-by":"crossref","unstructured":"Wu, J., Xiong, H., & Chen, J. (2009). Adapting the right measures for k-means clustering. In Proceedings of the 15th ACM SIGKDD international conference on Knowledge discovery and data mining (pp. 877\u2013886). ACM.","DOI":"10.1145\/1557019.1557115"},{"issue":"04","key":"5896_CR47","doi-asserted-by":"publisher","first-page":"597","DOI":"10.1142\/S0219622006002258","volume":"5","author":"Q Yang","year":"2006","unstructured":"Yang, Q., & Wu, X. (2006). 10 challenging problems in data mining research. 
International Journal of Information Technology & Decision Making, 5(04), 597\u2013604.","journal-title":"International Journal of Information Technology & Decision Making"}],"container-title":["Machine Learning"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-020-05896-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10994-020-05896-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10994-020-05896-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,10,5]],"date-time":"2023-10-05T21:20:28Z","timestamp":1696540828000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10994-020-05896-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,8,16]]},"references-count":47,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2021,1]]}},"alternative-id":["5896"],"URL":"https:\/\/doi.org\/10.1007\/s10994-020-05896-2","relation":{},"ISSN":["0885-6125","1573-0565"],"issn-type":[{"value":"0885-6125","type":"print"},{"value":"1573-0565","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,8,16]]},"assertion":[{"value":"9 February 2019","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 June 2020","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"7 July 2020","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 August 2020","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article 
History"}},{"value":"This content has been made available to all.","name":"free","label":"Free to read"}]}}