{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,6]],"date-time":"2025-11-06T01:01:38Z","timestamp":1762390898545},"reference-count":37,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,3,1]],"date-time":"2020-03-01T00:00:00Z","timestamp":1583020800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,3,1]],"date-time":"2020-03-01T00:00:00Z","timestamp":1583020800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,3,1]],"date-time":"2020-03-01T00:00:00Z","timestamp":1583020800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,3]]},"DOI":"10.1109\/ciss48834.2020.1570617381","type":"proceedings-article","created":{"date-parts":[[2020,5,7]],"date-time":"2020-05-07T22:27:40Z","timestamp":1588890460000},"page":"1-6","source":"Crossref","is-referenced-by-count":2,"title":["MSE-Optimal Neural Network Initialization via Layer Fusion"],"prefix":"10.1109","author":[{"given":"Ramina","family":"Ghods","sequence":"first","affiliation":[]},{"given":"Andrew S.","family":"Lan","sequence":"additional","affiliation":[]},{"given":"Tom","family":"Goldstein","sequence":"additional","affiliation":[]},{"given":"Christoph","family":"Studer","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref33","article-title":"Learning multiple layers of features from tiny images","author":"krizhevsky","year":"2009","journal-title":"Technical Repot University of Toronto Tech Rep"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1007\/s10959-010-0338-z"},{"key":"ref31","doi-asserted-by":"crossref","DOI":"10.1109\/CISS48834.2020.1570617381","article-title":"MSE-optimal neural network initialization via layer fusion","author":"ghods","year":"2020"},{"key":"ref30","first-page":"1269","article-title":"Exploiting linear structure within convolutional networks for efficient evaluation","author":"denton","year":"2014","journal-title":"Advances in Neural IInformation Processing Systems"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2018.2866979"},{"article-title":"Speech commands: A dataset for limited-vocabulary speech recognition","year":"2018","author":"warden","key":"ref36"},{"key":"ref35","first-page":"437","article-title":"A public domain dataset for human activity recognition using smartphones","author":"anguita","year":"2013","journal-title":"21th European Symposium on Artificial Neural Networks Computational Intelligence and Machine Learning (ESANN)"},{"article-title":"Fashion-MNIST: a novel image dataset for benchmarking machine learning algorithms","year":"2017","author":"xiao","key":"ref34"},{"key":"ref10","first-page":"2654","article-title":"Do deep nets really need to be deep?","author":"ba","year":"2014","journal-title":"Advances in Neural IInformation Processing Systems"},{"article-title":"Stronger generalization bounds for deep nets via a compression approach","year":"2018","author":"arora","key":"ref11"},{"key":"ref12","article-title":"Crosscorrelation functions of amplitude-distorted Gaussian signals","author":"bussgang","year":"1952","journal-title":"Technical Report M I T Cambridge MA Tech Rep 216"},{"key":"ref13","first-page":"1097","article-title":"Imagenet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Advances in Neural IInformation Processing Systems"},{"key":"ref14","first-page":"249","article-title":"Understanding the difficulty of training deep feedforward neural networks","author":"glorot","year":"2010","journal-title":"Proceedings of the 13th International Conference on Artificial Intelligence and Statistics (AISTATS)"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.123"},{"article-title":"All you need is a good init","year":"2015","author":"mishkin","key":"ref16"},{"article-title":"Exact solutions to the nonlinear dynamics of learning in deep linear neural networks","year":"2013","author":"saxe","key":"ref17"},{"article-title":"Distilling the knowledge in a neural network","year":"2015","author":"hinton","key":"ref18"},{"article-title":"ExpandNet: Training compact networks by linear expansion","year":"2019","author":"guo","key":"ref19"},{"key":"ref28","first-page":"1737","article-title":"Deep learning with limited numerical precision","author":"gupta","year":"2015","journal-title":"International Conference on Machine Learning (ICML)"},{"article-title":"Understanding deep learning requires rethinking generalization","year":"2016","author":"zhang","key":"ref4"},{"key":"ref27","first-page":"3123","article-title":"Binaryconnect: Training deep neural networks with binary weights during propagations","author":"courbariaux","year":"2015","journal-title":"Advances in Neural IInformation Processing Systems"},{"article-title":"A convergence theory for deep learning via over-parameterization","year":"2018","author":"allen-zhu","key":"ref3"},{"key":"ref6","first-page":"855","article-title":"On the computational efficiency of training neural networks","author":"livni","year":"2014","journal-title":"Advances in Neural IInformation Processing Systems"},{"key":"ref29","first-page":"806","article-title":"Sparse convolutional neural networks","author":"liu","year":"2015","journal-title":"Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR)"},{"article-title":"On the optimization of deep networks: Implicit acceleration by overparameterization","year":"2018","author":"arora","key":"ref5"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"article-title":"Mobilenets: Efficient convolutional neural networks for mobile vision applications","year":"2017","author":"howard","key":"ref7"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298594"},{"key":"ref9","first-page":"2148","article-title":"Predicting parameters in deep learning","author":"denil","year":"2013","journal-title":"Advances in Neural IInformation Processing Systems"},{"article-title":"Very deep convolutional networks for large-scale image recognition","year":"2014","author":"simonyan","key":"ref1"},{"article-title":"Deep compression: Compressing deep neural networks with pruning, trained quantization and Huffman coding","year":"2015","author":"han","key":"ref20"},{"key":"ref22","first-page":"1135","article-title":"Learning both weights and connections for efficient neural network","author":"han","year":"2015","journal-title":"Advances in Neural Information Processing Systems 13 Proceedings of the 2000 Conference"},{"key":"ref21","first-page":"1379","article-title":"Dynamic network surgery for efficient DNNs","author":"guo","year":"2016","journal-title":"Advances in Neural IInformation Processing Systems"},{"key":"ref24","first-page":"177","article-title":"Comparing biases for minimal network construction with back-propagation","author":"hanson","year":"1989","journal-title":"Advances in Neural IInformation Processing Systems"},{"key":"ref23","first-page":"164","article-title":"Second order derivatives for network pruning: Optimal brain surgeon","author":"hassibi","year":"1993","journal-title":"Advances in Neural IInformation Processing Systems"},{"article-title":"Compressing deep convolutional networks using vector quantization","year":"2014","author":"gong","key":"ref26"},{"key":"ref25","first-page":"598","article-title":"Optimal brain damage","author":"lecun","year":"1990","journal-title":"Advances in Neural IInformation Processing Systems"}],"event":{"name":"2020 54th Annual Conference on Information Sciences and Systems (CISS)","start":{"date-parts":[[2020,3,18]]},"location":"Princeton, NJ, USA","end":{"date-parts":[[2020,3,20]]}},"container-title":["2020 54th Annual Conference on Information Sciences and Systems (CISS)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9081570\/9086165\/09086241.pdf?arnumber=9086241","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,27]],"date-time":"2022-06-27T11:47:04Z","timestamp":1656330424000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9086241\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,3]]},"references-count":37,"URL":"https:\/\/doi.org\/10.1109\/ciss48834.2020.1570617381","relation":{},"subject":[],"published":{"date-parts":[[2020,3]]}}}