{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T07:26:32Z","timestamp":1740122792859,"version":"3.37.3"},"reference-count":42,"publisher":"Springer Science and Business Media LLC","issue":"8","license":[{"start":{"date-parts":[[2023,7,29]],"date-time":"2023-07-29T00:00:00Z","timestamp":1690588800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,7,29]],"date-time":"2023-07-29T00:00:00Z","timestamp":1690588800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100014188","name":"Ministry of Science and ICT, South Korea","doi-asserted-by":"publisher","award":["NRF-2017R1E1A1A03070105","NRF-2019R1A5A1028324"],"award-info":[{"award-number":["NRF-2017R1E1A1A03070105","NRF-2019R1A5A1028324"]}],"id":[{"id":"10.13039\/501100014188","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100003621","name":"Ministry of Science, ICT and Future Planning","doi-asserted-by":"publisher","award":["2019-0-01906","RS-2023-00219980","RS-2022-00165268"],"award-info":[{"award-number":["2019-0-01906","RS-2023-00219980","RS-2022-00165268"]}],"id":[{"id":"10.13039\/501100003621","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Neural Process Lett"],"published-print":{"date-parts":[[2023,12]]},"DOI":"10.1007\/s11063-023-11355-5","type":"journal-article","created":{"date-parts":[[2023,7,29]],"date-time":"2023-07-29T16:01:50Z","timestamp":1690646510000},"page":"10873-10904","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Concept-Oriented Self-Explaining Neural Networks"],"prefix":"10.1007","volume":"55","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8766-6934","authenticated-orcid":false,"given":"Min Sue","family":"Park","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3678-2687","authenticated-orcid":false,"given":"Hyung Ju","family":"Hwang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,7,29]]},"reference":[{"key":"11355_CR1","doi-asserted-by":"crossref","unstructured":"Ribeiro MT, Singh S, Guestrin C (2016) \u201c why should i trust you?\u201d Explaining the predictions of any classifier. In: Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining, pp 1135\u20131144","DOI":"10.1145\/2939672.2939778"},{"key":"11355_CR2","unstructured":"Lundberg S, Lee S-I (2017) A unified approach to interpreting model predictions, arXiv preprint arXiv:1705.07874"},{"key":"11355_CR3","doi-asserted-by":"publisher","first-page":"124887","DOI":"10.1109\/ACCESS.2021.3110270","volume":"9","author":"MS Park","year":"2021","unstructured":"Park MS, Son H, Hyun C, Hwang HJ (2021) Explainability of machine learning models for bankruptcy prediction. IEEE Access 9:124887\u2013124899","journal-title":"IEEE Access"},{"issue":"CSCW1","key":"11355_CR4","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3392878","volume":"4","author":"SR Hong","year":"2020","unstructured":"Hong SR, Hullman J, Bertini E (2020) Human factors in model interpretability: industry practices, challenges, and needs. Proc ACM Human-Comput Interact 4(CSCW1):1\u201326","journal-title":"Proc ACM Human-Comput Interact"},{"issue":"5","key":"11355_CR5","doi-asserted-by":"publisher","first-page":"206","DOI":"10.1038\/s42256-019-0048-x","volume":"1","author":"C Rudin","year":"2019","unstructured":"Rudin C (2019) Stop explaining black box machine learning models for high stakes decisions and use interpretable models instead. Nat Mach Intell 1(5):206\u2013215","journal-title":"Nat Mach Intell"},{"key":"11355_CR6","doi-asserted-by":"crossref","unstructured":"Schallner L, Rabold J, Scholz O, Schmid U (2019) Effect of superpixel aggregation on explanations in lime\u2013a case study with biological data. In: Joint European conference on machine learning and knowledge discovery in databases. Springer, pp 147\u2013158","DOI":"10.1007\/978-3-030-43823-4_13"},{"key":"11355_CR7","doi-asserted-by":"crossref","unstructured":"Chen T, Guestrin C (2016) Xgboost: A scalable tree boosting system. In: Proceedings of the 22nd ACM sigkdd international conference on knowledge discovery and data mining, pp 785\u2013794","DOI":"10.1145\/2939672.2939785"},{"key":"11355_CR8","first-page":"3146","volume":"30","author":"G Ke","year":"2017","unstructured":"Ke G, Meng Q, Finley T, Wang T, Chen W, Ma W, Ye Q, Liu T-Y (2017) Lightgbm: a highly efficient gradient boosting decision tree. Adv Neural Inf Process Syst 30:3146\u20133154","journal-title":"Adv Neural Inf Process Syst"},{"key":"11355_CR9","unstructured":"Alvarez\u00a0Melis D, Jaakkola T (2018) Towards robust interpretability with self-explaining neural networks. In: Bengio S, Wallach H, Larochelle H, Grauman K, Cesa-Bianchi N, Garnett R (eds) Advances in neural information processing systems, Vol.\u00a031, Curran Associates, Inc. https:\/\/proceedings.neurips.cc\/paper\/2018\/file\/3e9f0fc9b2f89e043bc6233994dfcf76-Paper.pdf"},{"key":"11355_CR10","unstructured":"Kim H, Mnih A (2018) Disentangling by factorising. In: International conference on machine learning, PMLR, pp 2649\u20132658"},{"key":"11355_CR11","unstructured":"Nair V, Hinton GE (2010) Rectified linear units improve restricted Boltzmann machines, In: Icml"},{"key":"11355_CR12","unstructured":"Lu L, Shin Y, Su Y, Karniadakis GE (2019) Dying ReLu and initialization: theory and numerical examples, arXiv preprint arXiv:1903.06733"},{"key":"11355_CR13","unstructured":"Shao J, Hu K, Wang C, Xue X, Raj B (2020) Is normalization indispensable for training deep neural network? Adv Neural Inf Process Syst 33"},{"key":"11355_CR14","unstructured":"Clevert D-A, Unterthiner T, Hochreiter S (2015) Fast and accurate deep network learning by exponential linear units (elus), arXiv preprint arXiv:1511.07289"},{"issue":"26","key":"11355_CR15","doi-asserted-by":"publisher","first-page":"1629","DOI":"10.1056\/NEJM198512263132604","volume":"313","author":"K Godfrey","year":"1985","unstructured":"Godfrey K (1985) Simple linear regression in medical research. N Engl J Med 313(26):1629\u20131636","journal-title":"N Engl J Med"},{"key":"11355_CR16","volume-title":"Statistics and finance: an introduction","author":"D Ruppert","year":"2014","unstructured":"Ruppert D (2014) Statistics and finance: an introduction. Springer, New York"},{"issue":"2\u20133","key":"11355_CR17","doi-asserted-by":"publisher","first-page":"360","DOI":"10.1177\/0049124189018002006","volume":"18","author":"JA Dubin","year":"1989","unstructured":"Dubin JA, Rivers D (1989) Selection bias in linear regression, logit and probit models. Sociol Methods Res 18(2\u20133):360\u2013390","journal-title":"Sociol Methods Res"},{"key":"11355_CR18","doi-asserted-by":"publisher","DOI":"10.1016\/j.asoc.2019.105524","volume":"97","author":"D Singh","year":"2020","unstructured":"Singh D, Singh B (2020) Investigating the impact of data normalization on classification performance. Appl Soft Comput 97:105524","journal-title":"Appl Soft Comput"},{"issue":"3","key":"11355_CR19","doi-asserted-by":"publisher","first-page":"1464","DOI":"10.1109\/23.589532","volume":"44","author":"J Sola","year":"1997","unstructured":"Sola J, Sevilla J (1997) Importance of input data normalization for the application of neural networks to complex industrial problems. IEEE Trans Nucl Sci 44(3):1464\u20131468","journal-title":"IEEE Trans Nucl Sci"},{"key":"11355_CR20","unstructured":"Ioffe S, Szegedy C (2015) Batch normalization: accelerating deep network training by reducing internal covariate shift. In: International conference on machine learning, PMLR, pp 448\u2013456"},{"key":"11355_CR21","unstructured":"Santurkar S, Tsipras D, Ilyas A, Madry A (2018) How does batch normalization help optimization? arXiv preprint arXiv:1805.11604"},{"key":"11355_CR22","unstructured":"Eidnes L, N\u00f8kland A, Shifting mean activation towards zero with bipolar activation function"},{"key":"11355_CR23","unstructured":"Klambauer G, Unterthiner T, Mayr A, Hochreiter S (2017) Self-normalizing neural networks, arXiv preprint arXiv:1706.02515"},{"issue":"1","key":"11355_CR24","doi-asserted-by":"publisher","first-page":"66","DOI":"10.1147\/rd.41.0066","volume":"4","author":"S Watanabe","year":"1960","unstructured":"Watanabe S (1960) Information theoretical analysis of multivariate correlation. IBM J Res Dev 4(1):66\u201382","journal-title":"IBM J Res Dev"},{"key":"11355_CR25","unstructured":"Kim H, Mnih A (2018) Disentangling by factorising. In: International conference on machine learning, PMLR, pp 2649\u20132658"},{"key":"11355_CR26","doi-asserted-by":"crossref","unstructured":"Fu H, Li C, Liu X, Gao J, Celikyilmaz A, Carin L (2019) Cyclical annealing schedule: a simple approach to mitigating kl vanishing, arXiv preprint arXiv:1903.10145","DOI":"10.18653\/v1\/N19-1021"},{"key":"11355_CR27","doi-asserted-by":"crossref","unstructured":"Panaretos VM, Zemel Y (2020) The wasserstein space. In: International workshop on functional and operatorial statistics. Springer, pp 37\u201357","DOI":"10.1007\/978-3-030-38438-8_2"},{"key":"11355_CR28","unstructured":"Xiao Y, Wang WY. Disentangled representation learning with wasserstein total correlation, arXiv preprint arXiv:1912.12818"},{"key":"11355_CR29","volume-title":"Optimal transport: old and new","author":"C Villani","year":"2008","unstructured":"Villani C (2008) Optimal transport: old and new, vol 338. Springer, New York"},{"key":"11355_CR30","unstructured":"Gulrajani I, Ahmed F, Arjovsky M, Dumoulin V, Courville A (2017) Improved training of wasserstein gans, arXiv preprint arXiv:1704.00028"},{"key":"11355_CR31","unstructured":"Arjovsky M, Chintala S, Bottou L (2017) Wasserstein generative adversarial networks. In: International conference on machine learning, PMLR, pp 214\u2013223"},{"key":"11355_CR32","unstructured":"Tolstikhin I, Bousquet O, Gelly S, Schoelkopf B (2017) Wasserstein auto-encoders, arXiv preprint arXiv:1711.01558"},{"key":"11355_CR33","doi-asserted-by":"crossref","unstructured":"Arcones MA, Gine E (1992) On the bootstrap of u and v statistics. Ann Stat, pp 655\u2013674","DOI":"10.1214\/aos\/1176348650"},{"key":"11355_CR34","unstructured":"Brock A, Lim T, Ritchie JM, Weston N (2016) Neural photo editing with introspective adversarial networks, arXiv preprint arXiv:1609.07093"},{"key":"11355_CR35","unstructured":"Brock A, Donahue J, Simonyan K (2018) Large scale gan training for high fidelity natural image synthesis, arXiv preprint arXiv:1809.11096"},{"key":"11355_CR36","unstructured":"Doshi-Velez F, Kim B (2017) Towards a rigorous science of interpretable machine learning, arXiv preprint arXiv:1702.08608"},{"key":"11355_CR37","unstructured":"LeCun Y, Cortes C, Burges C (2010) Mnist handwritten digit database, ATT Labs.http:\/\/yann.lecun.com\/exdb\/mnist 2"},{"key":"11355_CR38","unstructured":"Xiao H, Rasul K, Vollgraf R (2017) Fashion-mnist: a novel image dataset for benchmarking machine learning algorithms, arXiv preprint arXiv:1708.07747"},{"key":"11355_CR39","unstructured":"Krizhevsky A, Nair V, Hinton G (2014) The cifar-10 dataset. http:\/\/www.cs.toronto.edu\/kriz\/cifar.html 55(5)"},{"issue":"11","key":"11355_CR40","doi-asserted-by":"publisher","first-page":"5847","DOI":"10.1109\/TIT.2010.2068870","volume":"56","author":"X Nguyen","year":"2010","unstructured":"Nguyen X, Wainwright MJ, Jordan MI (2010) Estimating divergence functionals and the likelihood ratio by convex risk minimization. IEEE Trans Inf Theory 56(11):5847\u20135861","journal-title":"IEEE Trans Inf Theory"},{"issue":"5","key":"11355_CR41","doi-asserted-by":"publisher","first-page":"1009","DOI":"10.1007\/s10463-011-0343-8","volume":"64","author":"M Sugiyama","year":"2012","unstructured":"Sugiyama M, Suzuki T, Kanamori T (2012) Density-ratio matching under the Bregman divergence: a unified framework of density-ratio estimation. Ann Inst Stat Math 64(5):1009\u20131044","journal-title":"Ann Inst Stat Math"},{"key":"11355_CR42","doi-asserted-by":"crossref","unstructured":"Bowman SR, Vilnis L, Vinyals O, Dai AM, Jozefowicz R, Bengio S (2015) Generating sentences from a continuous space, arXiv preprint arXiv:1511.06349","DOI":"10.18653\/v1\/K16-1002"}],"container-title":["Neural Processing Letters"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11063-023-11355-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11063-023-11355-5\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11063-023-11355-5.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,11,22]],"date-time":"2023-11-22T05:13:17Z","timestamp":1700629997000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11063-023-11355-5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,7,29]]},"references-count":42,"journal-issue":{"issue":"8","published-print":{"date-parts":[[2023,12]]}},"alternative-id":["11355"],"URL":"https:\/\/doi.org\/10.1007\/s11063-023-11355-5","relation":{},"ISSN":["1370-4621","1573-773X"],"issn-type":[{"type":"print","value":"1370-4621"},{"type":"electronic","value":"1573-773X"}],"subject":[],"published":{"date-parts":[[2023,7,29]]},"assertion":[{"value":"8 July 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"29 July 2023","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}