{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,16]],"date-time":"2026-07-16T20:24:51Z","timestamp":1784233491998,"version":"3.55.0"},"reference-count":61,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"12","license":[{"start":{"date-parts":[[2020,12,1]],"date-time":"2020-12-01T00:00:00Z","timestamp":1606780800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,12,1]],"date-time":"2020-12-01T00:00:00Z","timestamp":1606780800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,12,1]],"date-time":"2020-12-01T00:00:00Z","timestamp":1606780800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China (NSFC) fund","doi-asserted-by":"publisher","award":["61571259"],"award-info":[{"award-number":["61571259"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China (NSFC) fund","doi-asserted-by":"publisher","award":["61831014"],"award-info":[{"award-number":["61831014"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China (NSFC) fund","doi-asserted-by":"publisher","award":["61531014"],"award-info":[{"award-number":["61531014"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Shenzhen Science and Technology Project","award":["JCYJ20170817161916238"],"award-info":[{"award-number":["JCYJ20170817161916238"]}]},{"name":"Shenzhen Science and Technology Project","award":["JCYJ20180508152042002"],"award-info":[{"award-number":["JCYJ20180508152042002"]}]},{"name":"Shenzhen Science and Technology Project","award":["GGFW2017040714161462"],"award-info":[{"award-number":["GGFW2017040714161462"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Neural Netw. Learning Syst."],"published-print":{"date-parts":[[2020,12]]},"DOI":"10.1109\/tnnls.2019.2963066","type":"journal-article","created":{"date-parts":[[2020,1,28]],"date-time":"2020-01-28T22:38:41Z","timestamp":1580251121000},"page":"5079-5091","source":"Crossref","is-referenced-by-count":77,"title":["PID Controller-Based Stochastic Optimization Acceleration for Deep Neural Networks"],"prefix":"10.1109","volume":"31","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2792-8469","authenticated-orcid":false,"given":"Haoqian","family":"Wang","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3727-5679","authenticated-orcid":false,"given":"Yi","family":"Luo","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1869-1837","authenticated-orcid":false,"given":"Wangpeng","family":"An","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Qingyun","family":"Sun","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1602-538X","authenticated-orcid":false,"given":"Jun","family":"Xu","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2078-4215","authenticated-orcid":false,"given":"Lei","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref39","first-page":"6869","article-title":"Quantized neural networks: Training neural networks with low precision weights and activations","volume":"18","author":"hubara","year":"2017","journal-title":"J Mach Learn Res"},{"key":"ref38","article-title":"Cgap: Continuous growth and pruning for efficient deep learning","author":"du","year":"2019","journal-title":"arXiv 1905 11533"},{"key":"ref33","first-page":"1120","article-title":"Unitary evolution recurrent neural networks","author":"arjovsky","year":"2016","journal-title":"Proc 33nd Int Conf Mach Learn (ICML)"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref31","article-title":"Generative adversarial nets","author":"goodfellow","year":"2014","journal-title":"Proc NIPS"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2012.231"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TC.2019.2914438"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00447"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.298"},{"key":"ref34","article-title":"Deep compression: Compressing deep neural networks with pruning, trained quantization and Huffman coding","author":"han","year":"2015","journal-title":"Proc Int Conf Learn Represent (ICLR)"},{"key":"ref60","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7472159"},{"key":"ref61","first-page":"1019","article-title":"A theoretically grounded application of dropout in recurrent neural networks","author":"gal","year":"2016","journal-title":"Proc Adv Neural Inf Process Syst Annu Conf Neural Inf Process Syst"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2577031"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2437384"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2587642"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-7908-2604-3_16"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-015-0816-y"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/AQTR.2010.5520914"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.5772\/51314"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/70.508444"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00889"},{"key":"ref23","author":"laplace","year":"1820","journal-title":"Theorie analytique des probabilites"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2491929"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1016\/0041-5553(64)90137-5"},{"key":"ref50","author":"spiegel","year":"1991","journal-title":"Advanced Mathematics"},{"key":"ref51","article-title":"An analysis of the behavior of a class of genetic adaptive systems","author":"de jong","year":"1975"},{"key":"ref59","article-title":"Recurrent batch normalization","author":"cooijmans","year":"2016","journal-title":"arXiv 1603 09025"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.634"},{"key":"ref57","article-title":"Learning multiple layers of features from tiny images","author":"krizhevsky","year":"2009"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/5.726791"},{"key":"ref55","author":"li","year":"2015","journal-title":"Tiny imagenet visual recognition challenge"},{"key":"ref54","author":"khalil","year":"1996","journal-title":"Nonlinear Systems"},{"key":"ref53","author":"robert","year":"1966","journal-title":"Table of Laplace Transforms"},{"key":"ref52","first-page":"759","article-title":"Optimum settings for automatic controllers","volume":"64","author":"ziegler","year":"1942","journal-title":"Trans ASME"},{"key":"ref10","author":"goodfellow","year":"2016","journal-title":"Deep Learning"},{"key":"ref11","first-page":"9","article-title":"Online learning and stochastic approximations","author":"bottou","year":"1998","journal-title":"Online Learning in Neural Networks"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/ITA.2018.8503173"},{"key":"ref12","article-title":"On the importance of initialization and momentum in deep learning","author":"sutskever","year":"2013","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref13","first-page":"2121","article-title":"Adaptive subgradient methods for online learning and stochastic optimization","volume":"12","author":"duchi","year":"2011","journal-title":"J Mach Learn Res"},{"key":"ref14","author":"hinton","year":"2012","journal-title":"Neural networks for machine learning lecture 6a overview of mini-batch gradient descent"},{"key":"ref15","article-title":"Adam: A method for stochastic optimization","author":"kingma","year":"2014","journal-title":"Proc Int Conf Learn Represent (ICLR)"},{"key":"ref16","volume":"2","author":"ogata","year":"1995","journal-title":"Discrete-Time Control Systems"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1137\/15M1009597"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1049\/ip-cta:19951859"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/TCST.2005.847331"},{"key":"ref4","first-page":"1269","article-title":"Exploiting linear structure within convolutional networks for efficient evaluation","author":"denton","year":"2014","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref3","article-title":"Gradient descent based optimization algorithms for deep learning models training","author":"zhang","year":"2019","journal-title":"arXiv 1903 03614"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2502579"},{"key":"ref5","article-title":"Speeding up convolutional neural networks with low rank expansions","author":"jaderberg","year":"2014","journal-title":"arXiv 1405 3866"},{"key":"ref8","article-title":"Fitnets: Hints for thin deep nets","author":"romero","year":"2015","journal-title":"Proc Int Conf Learn Representations"},{"key":"ref7","article-title":"Fast convolutional nets with fbfft: A GPU performance evaluation","author":"vasilache","year":"2014","journal-title":"arXiv 1412 7580"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1016\/S0893-6080(98)00116-6"},{"key":"ref9","article-title":"An empirical analysis of the optimization of deep network loss surfaces","author":"im","year":"2017","journal-title":"Proc of the Int Conf on Learning Representations (ICLR)"},{"key":"ref46","first-page":"543","article-title":"A method of solving a convex programming problem with convergence rate o (1\/k2)","volume":"269","author":"nesterov","year":"1983","journal-title":"Sov Math Doklady"},{"key":"ref45","article-title":"Wide residual networks","author":"zagoruyko","year":"2016","journal-title":"Proc Brit Mach Vis Conf"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1111\/j.1559-3584.1922.tb04958.x"},{"key":"ref47","first-page":"270","article-title":"On governors","volume":"16","author":"maxwell","year":"1867","journal-title":"Proc Roy Soc London"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref41","article-title":"Pruning filters for efficient convnets","author":"li","year":"2016","journal-title":"arXiv 1608 08710"},{"key":"ref44","first-page":"630","article-title":"Identity mappings in deep residual networks","author":"he","year":"2016","journal-title":"Proc IEEE Eur Conf Comput Vis (ECCV)"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.243"}],"container-title":["IEEE Transactions on Neural Networks and Learning Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/5962385\/9273274\/08972933.pdf?arnumber=8972933","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,4,27]],"date-time":"2022-04-27T17:19:38Z","timestamp":1651079978000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8972933\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,12]]},"references-count":61,"journal-issue":{"issue":"12"},"URL":"https:\/\/doi.org\/10.1109\/tnnls.2019.2963066","relation":{},"ISSN":["2162-237X","2162-2388"],"issn-type":[{"value":"2162-237X","type":"print"},{"value":"2162-2388","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,12]]}}}