{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,13]],"date-time":"2026-03-13T04:55:48Z","timestamp":1773377748402,"version":"3.50.1"},"reference-count":22,"publisher":"IEEE","license":[{"start":{"date-parts":[[2019,7,1]],"date-time":"2019-07-01T00:00:00Z","timestamp":1561939200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2019,7,1]],"date-time":"2019-07-01T00:00:00Z","timestamp":1561939200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2019,7]]},"DOI":"10.1109\/isit.2019.8849289","type":"proceedings-article","created":{"date-parts":[[2019,9,26]],"date-time":"2019-09-26T21:46:12Z","timestamp":1569534372000},"page":"1972-1976","source":"Crossref","is-referenced-by-count":4,"title":["Local Geometry of Cross Entropy Loss in Learning One-Hidden-Layer Neural Networks"],"prefix":"10.1109","author":[{"given":"Haoyu","family":"Fu","sequence":"first","affiliation":[{"name":"Dept. of ECE, The Ohio State University, Columbus, OH, 43210, USA"}]},{"given":"Yuejie","family":"Chi","sequence":"additional","affiliation":[{"name":"Dept. of ECE, Carnegie Mellon University, Pittsburgh, PA, 15213, USA"}]},{"given":"Yingbin","family":"Liang","sequence":"additional","affiliation":[{"name":"Dept. of ECE, The Ohio State University, Columbus, OH, 43210, USA"}]}],"member":"263","reference":[{"key":"ref10","article-title":"Theoretical insights into the optimization landscape of over-parameterized shallow neural networks","author":"soltanolkotabi","year":"2018","journal-title":"IEEE Transactions on Information Theory"},{"key":"ref11","article-title":"Theoretical properties of the global optimizer of two layer neural network","author":"boob","year":"2017"},{"key":"ref12","first-page":"774","article-title":"On the quality of the initial basin in overspecified neural networks","author":"safran","year":"2016","journal-title":"International Conference on Machine Learning"},{"key":"ref13","first-page":"2603","article-title":"The loss surface of deep and wide neural networks","author":"nguyen","year":"2017","journal-title":"International Conference on Machine Learning"},{"key":"ref14","article-title":"Learning one-hidden-layer neural networks with landscape design","author":"ge","year":"2018","journal-title":"International Conference on Learning Representations"},{"key":"ref15","first-page":"4433","article-title":"Spurious local minima are common in two-layer ReLU neural networks","author":"safran","year":"2018","journal-title":"Proc 35th Int Conf Mach Learn"},{"key":"ref16","article-title":"Learning one-hidden-layer relu networks via gradient descent","author":"zhang","year":"2018"},{"key":"ref17","article-title":"Nonconvex matrix factorization from rank-one measurements","author":"li","year":"2018"},{"key":"ref18","first-page":"1783","article-title":"Learning one convolutional layer with overlapping patches","author":"goel","year":"2018","journal-title":"Proc 35th Int Conf Mach Learn"},{"key":"ref19","first-page":"4836","article-title":"Porcupine neural networks: Approximating neural network landscapes","volume":"31","author":"feizi","year":"2018","journal-title":"Advances in neural information processing systems"},{"key":"ref4","first-page":"597","article-title":"Convergence analysis of two-layer neural networks with relu activation","author":"li","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref3","first-page":"4140","article-title":"Recovery guarantees for one-hidden-layer neural networks","volume":"70","author":"zhong","year":"2017","journal-title":"Proceedings of the 34th International Conference on Machine Learning"},{"key":"ref6","first-page":"605","article-title":"Globally optimal gradient descent for a ConvNet with Gaussian inputs","author":"brutzkus","year":"2017","journal-title":"Proceedings of the 34th International Conference on Machine Learning"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1214\/17-AOS1637"},{"key":"ref8","article-title":"When is a convolutional filter easy to learn*","author":"du","year":"2018","journal-title":"International Conference on Learning Representations"},{"key":"ref7","first-page":"3966","article-title":"Learning compact neural networks with regularization","author":"oymak","year":"2018","journal-title":"Proc 35th Int Conf Mach Learn"},{"key":"ref2","first-page":"2007","article-title":"Learning relus via gradient descent","volume":"30","author":"soltanolkotabi","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref1","article-title":"On the connection between learning two-layers neural networks and tensor decomposition","author":"mondelli","year":"2018"},{"key":"ref9","article-title":"Local geometry of one-hidden-layer neural networks for logistic regression","author":"fu","year":"2018"},{"key":"ref20","article-title":"A convergence theory for deep learning via over-parameterization","author":"allen-zhu","year":"2018"},{"key":"ref22","article-title":"Stochastic gradient descent optimizes over-parameterized deep relu networks","author":"zou","year":"2018"},{"key":"ref21","article-title":"Gradient descent finds global minima of deep neural networks","author":"du","year":"2018"}],"event":{"name":"2019 IEEE International Symposium on Information Theory (ISIT)","location":"Paris, France","start":{"date-parts":[[2019,7,7]]},"end":{"date-parts":[[2019,7,12]]}},"container-title":["2019 IEEE International Symposium on Information Theory (ISIT)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/8827389\/8849208\/08849289.pdf?arnumber=8849289","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,12]],"date-time":"2026-03-12T20:35:03Z","timestamp":1773347703000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8849289\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,7]]},"references-count":22,"URL":"https:\/\/doi.org\/10.1109\/isit.2019.8849289","relation":{},"subject":[],"published":{"date-parts":[[2019,7]]}}}