{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,7]],"date-time":"2025-10-07T14:32:08Z","timestamp":1759847528269,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":35,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,7,15]],"date-time":"2023-07-15T00:00:00Z","timestamp":1689379200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"DOI":"10.13039\/501100001321","name":"National Research Foundation","doi-asserted-by":"publisher","award":["13819413"],"award-info":[{"award-number":["13819413"]}],"id":[{"id":"10.13039\/501100001321","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,7,15]]},"DOI":"10.1145\/3583133.3596321","type":"proceedings-article","created":{"date-parts":[[2023,7,24]],"date-time":"2023-07-24T23:30:33Z","timestamp":1690241433000},"page":"2029-2037","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["Empirical Loss Landscape Analysis of Neural Network Activation Functions"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3546-1467","authenticated-orcid":false,"given":"Anna Sergeevna","family":"Bosman","sequence":"first","affiliation":[{"name":"Computer Science, University of Pretoria, Pretoria, Gauteng, South Africa"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0242-3539","authenticated-orcid":false,"given":"Andries","family":"Engelbrecht","sequence":"additional","affiliation":[{"name":"University of Stellenbosch, Stellenbosch, South Africa"},{"name":"Center for Applied Mathematics and Bioinformatics, Gulf University for Science and Technology, Kuwait City, Kuwait"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4907-0662","authenticated-orcid":false,"given":"Marde","family":"Helbig","sequence":"additional","affiliation":[{"name":"School of Information and Communication Technology, Griffith University, Southport, Australia"}]}],"member":"320","published-online":{"date-parts":[[2023,7,24]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Proceedings of the International Conference on Learning Representations","author":"Arora Raman","year":"2018","unstructured":"Raman Arora , Amitabh Basu , Poorya Mianjy , and Anirbit Mukherjee . 2018 . Understanding deep neural networks with rectified linear units . In Proceedings of the International Conference on Learning Representations . Vancouver, Canada, 1--17. Raman Arora, Amitabh Basu, Poorya Mianjy, and Anirbit Mukherjee. 2018. Understanding deep neural networks with rectified linear units. In Proceedings of the International Conference on Learning Representations. Vancouver, Canada, 1--17."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2020.02.113"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/SSCI.2016.7850152"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/3205651.3208247"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN48605.2020.9206727"},{"key":"e_1_3_2_1_6_1","volume-title":"Asian Conference on Machine Learning. PMLR, 545--560","author":"Cao Jiezhang","year":"2017","unstructured":"Jiezhang Cao , Qingyao Wu , Yuguang Yan , Li Wang , and Mingkui Tan . 2017 . On the flatness of loss surface for two-layered relu networks . In Asian Conference on Machine Learning. PMLR, 545--560 . Jiezhang Cao, Qingyao Wu, Yuguang Yan, Li Wang, and Mingkui Tan. 2017. On the flatness of loss surface for two-layered relu networks. In Asian Conference on Machine Learning. PMLR, 545--560."},{"key":"e_1_3_2_1_7_1","volume-title":"Proceedings of the International Conference on Learning Representations. 1--14","author":"Clevert Djork-Arn\u00e9","year":"2016","unstructured":"Djork-Arn\u00e9 Clevert , Thomas Unterthiner , and Sepp Hochreiter . 2016 . Fast and accurate deep network learning by exponential linear units (ELUs) . In Proceedings of the International Conference on Learning Representations. 1--14 . Djork-Arn\u00e9 Clevert, Thomas Unterthiner, and Sepp Hochreiter. 2016. Fast and accurate deep network learning by exponential linear units (ELUs). In Proceedings of the International Conference on Learning Representations. 1--14."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1111\/j.1469-1809.1936.tb02137.x"},{"key":"e_1_3_2_1_9_1","volume-title":"Proceedings of the International Conference on Artificial Intelligence and Statistics. 249--256","author":"Glorot Xavier","year":"2010","unstructured":"Xavier Glorot and Yoshua Bengio . 2010 . Understanding the difficulty of training deep feedforward neural networks . In Proceedings of the International Conference on Artificial Intelligence and Statistics. 249--256 . Xavier Glorot and Yoshua Bengio. 2010. Understanding the difficulty of training deep feedforward neural networks. In Proceedings of the International Conference on Artificial Intelligence and Statistics. 249--256."},{"key":"e_1_3_2_1_10_1","volume-title":"Proceedings of the International Conference on Artificial Intelligence and Statistics. 315--323","author":"Glorot Xavier","year":"2011","unstructured":"Xavier Glorot , Antoine Bordes , and Yoshua Bengio . 2011 . Deep sparse rectifier neural networks . In Proceedings of the International Conference on Artificial Intelligence and Statistics. 315--323 . Xavier Glorot, Antoine Bordes, and Yoshua Bengio. 2011. Deep sparse rectifier neural networks. In Proceedings of the International Conference on Artificial Intelligence and Statistics. 315--323."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0893-6080(97)00134-2"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1142\/S0218488598000094"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1016\/0893-6080(89)90020-8"},{"key":"e_1_3_2_1_14_1","first-page":"611","article-title":"A survey of factors influencing MLP error surface","volume":"33","author":"Kordos Miros\u0142aw","year":"2004","unstructured":"Miros\u0142aw Kordos and Wlodzis\u0142aw Duch . 2004 . A survey of factors influencing MLP error surface . Control and Cybernetics 33 , 4 (2004), 611 -- 631 . Miros\u0142aw Kordos and Wlodzis\u0142aw Duch. 2004. A survey of factors influencing MLP error surface. Control and Cybernetics 33, 4 (2004), 611--631.","journal-title":"Control and Cybernetics"},{"key":"e_1_3_2_1_15_1","volume-title":"International conference on machine learning. PMLR, 2908--2916","author":"Laurent Thomas","year":"2018","unstructured":"Thomas Laurent and James Brecht . 2018 . The multilinear structure of ReLU networks . In International conference on machine learning. PMLR, 2908--2916 . Thomas Laurent and James Brecht. 2018. The multilinear structure of ReLU networks. In International conference on machine learning. PMLR, 2908--2916."},{"key":"e_1_3_2_1_16_1","volume-title":"MNIST handwritten digit database. AT&T Labs","author":"LeCun Yann","year":"2010","unstructured":"Yann LeCun , Corinna Cortes , and CJ Burges . 2010. MNIST handwritten digit database. AT&T Labs ( 2010 ). Yann LeCun, Corinna Cortes, and CJ Burges. 2010. MNIST handwritten digit database. AT&T Labs (2010)."},{"key":"e_1_3_2_1_17_1","volume-title":"Proceedings of the 35th International Conference on Machine Learning (Proceedings of Machine Learning Research","volume":"2843","author":"Liang Shiyu","year":"2018","unstructured":"Shiyu Liang , Ruoyu Sun , Yixuan Li , and Rayadurgam Srikant . 2018 . Understanding the Loss Surface of Neural Networks for Binary Classification . In Proceedings of the 35th International Conference on Machine Learning (Proceedings of Machine Learning Research , Vol. 80), Jennifer Dy and Andreas Krause (Eds.). PMLR, 2835-- 2843 . Shiyu Liang, Ruoyu Sun, Yixuan Li, and Rayadurgam Srikant. 2018. Understanding the Loss Surface of Neural Networks for Binary Classification. In Proceedings of the 35th International Conference on Machine Learning (Proceedings of Machine Learning Research, Vol. 80), Jennifer Dy and Andreas Krause (Eds.). PMLR, 2835--2843."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.knosys.2021.106923"},{"volume-title":"Characterising continuous optimisation problems for particle swarm optimisation performance prediction. Ph. D. Dissertation","author":"Malan Katherine Mary","key":"e_1_3_2_1_19_1","unstructured":"Katherine Mary Malan . 2014. Characterising continuous optimisation problems for particle swarm optimisation performance prediction. Ph. D. Dissertation . University of Pretoria . Katherine Mary Malan. 2014. Characterising continuous optimisation problems for particle swarm optimisation performance prediction. Ph. D. Dissertation. University of Pretoria."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.3390\/a14020040"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/CEC.2009.4983112"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2013.04.015"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/CEC.2014.6900576"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1103\/PhysRevE.97.052307"},{"key":"e_1_3_2_1_25_1","volume-title":"Piecewise strong convexity of neural networks. Advances in Neural Information Processing Systems 32","author":"Milne Tristan","year":"2019","unstructured":"Tristan Milne . 2019. Piecewise strong convexity of neural networks. Advances in Neural Information Processing Systems 32 ( 2019 ). Tristan Milne. 2019. Piecewise strong convexity of neural networks. Advances in Neural Information Processing Systems 32 (2019)."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2015.05.010"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.5555\/3104322.3104425"},{"volume-title":"Recent Advances in Intelligent Engineering Systems","author":"Pitzer Erik","key":"e_1_3_2_1_28_1","unstructured":"Erik Pitzer and Michael Affenzeller . 2012. A comprehensive survey on fitness landscape analysis . In Recent Advances in Intelligent Engineering Systems . Springer , 161--191. Erik Pitzer and Michael Affenzeller. 2012. A comprehensive survey on fitness landscape analysis. In Recent Advances in Intelligent Engineering Systems. Springer, 161--191."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/SSCI.2015.202"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/CEC.2015.7256883"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neunet.2017.06.009"},{"key":"e_1_3_2_1_34_1","volume-title":"International Conference on Machine Learning. PMLR, 4433--4441","author":"Safran Itay","year":"2018","unstructured":"Itay Safran and Ohad Shamir . 2018 . Spurious local minima are common in two-layer relu neural networks . In International Conference on Machine Learning. PMLR, 4433--4441 . Itay Safran and Ohad Shamir. 2018. Spurious local minima are common in two-layer relu neural networks. In International Conference on Machine Learning. PMLR, 4433--4441."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/CEC.2001.934364"},{"volume-title":"Principles of random walk","author":"Spitzer Frank","key":"e_1_3_2_1_36_1","unstructured":"Frank Spitzer . 2013. Principles of random walk . Vol. 34 . Springer Science & Business Media . Frank Spitzer. 2013. Principles of random walk. Vol. 34. Springer Science & Business Media."},{"key":"e_1_3_2_1_37_1","volume-title":"Empirical evaluation of rectified activations in convolutional network. arXiv preprint arXiv:1505.00853","author":"Xu Bing","year":"2015","unstructured":"Bing Xu , Naiyan Wang , Tianqi Chen , and Mu Li. 2015. Empirical evaluation of rectified activations in convolutional network. arXiv preprint arXiv:1505.00853 ( 2015 ). Bing Xu, Naiyan Wang, Tianqi Chen, and Mu Li. 2015. Empirical evaluation of rectified activations in convolutional network. arXiv preprint arXiv:1505.00853 (2015)."}],"event":{"name":"GECCO '23 Companion: Companion Conference on Genetic and Evolutionary Computation","sponsor":["SIGEVO ACM Special Interest Group on Genetic and Evolutionary Computation"],"location":"Lisbon Portugal","acronym":"GECCO '23 Companion"},"container-title":["Proceedings of the Companion Conference on Genetic and Evolutionary Computation"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3583133.3596321","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3583133.3596321","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T17:48:54Z","timestamp":1750182534000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3583133.3596321"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,7,15]]},"references-count":35,"alternative-id":["10.1145\/3583133.3596321","10.1145\/3583133"],"URL":"https:\/\/doi.org\/10.1145\/3583133.3596321","relation":{},"subject":[],"published":{"date-parts":[[2023,7,15]]},"assertion":[{"value":"2023-07-24","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}