{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,2,21]],"date-time":"2025-02-21T01:06:50Z","timestamp":1740100010224,"version":"3.37.3"},"reference-count":29,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,6,6]],"date-time":"2021-06-06T00:00:00Z","timestamp":1622937600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,6,6]],"date-time":"2021-06-06T00:00:00Z","timestamp":1622937600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,6,6]],"date-time":"2021-06-06T00:00:00Z","timestamp":1622937600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,6,6]]},"DOI":"10.1109\/icassp39728.2021.9413500","type":"proceedings-article","created":{"date-parts":[[2021,5,13]],"date-time":"2021-05-13T19:53:45Z","timestamp":1620935625000},"page":"3895-3899","source":"Crossref","is-referenced-by-count":1,"title":["Inertial Proximal Deep Learning Alternating Minimization for Efficient Neutral Network Training"],"prefix":"10.1109","author":[{"given":"Linbo","family":"Qiao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tao","family":"Sun","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hengyue","family":"Pan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dongsheng","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33014181"},{"article-title":"Fenchel lifted networks: A lagrange relaxation of neural network training","year":"2018","author":"gu","key":"ref11"},{"key":"ref12","first-page":"10","article-title":"Distributed optimization of deeply nested systems","author":"carreira-perpinan","year":"2014","journal-title":"Artificial Intelligence and Statistics"},{"key":"ref13","doi-asserted-by":"crossref","first-page":"185","DOI":"10.1007\/978-1-4419-9569-8_10","article-title":"Proximal splitting methods in signal processing","author":"combettes","year":"2011","journal-title":"Fixed-Point Algorithms For Inverse Problems in Science and Engineering"},{"key":"ref14","first-page":"807","article-title":"Rectified linear units improve restricted boltzmann machines","author":"nair","year":"2010","journal-title":"Proceedings of the 27th International Conference on Machine Learning (ICML-10)"},{"key":"ref15","first-page":"7313","article-title":"Global convergence of block coordinate descent in deep learning","author":"zeng","year":"2019","journal-title":"vol 97 of Proceedings of Machine Learning Research"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8683703"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1016\/0041-5553(64)90137-5"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1137\/130942954"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1137\/16M1064064"},{"article-title":"Adadelta: an adaptive learning rate method","year":"2012","author":"zeiler","key":"ref28"},{"key":"ref4","first-page":"2722","article-title":"Training neural networks without gradients: A scalable admm approach","author":"taylor","year":"2016","journal-title":"International Conference on Machine Learning"},{"key":"ref27","first-page":"2121","article-title":"Adaptive subgradient methods for online learning and stochastic optimization","volume":"12","author":"duchi","year":"2011","journal-title":"Journal of Machine Learning Research"},{"article-title":"Gradient flow in recurrent nets: the difficulty of learning longterm dependencies","year":"2001","author":"hochreiter","key":"ref3"},{"key":"ref6","first-page":"1721","article-title":"Convergent block coordinate descent for training tikhonov regularized deep neural networks","author":"zhang","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref29","article-title":"Adam: A method for stochastic optimization","author":"kingma","year":"2014","journal-title":"ICLRE"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.165"},{"article-title":"Lifted neural networks","year":"2018","author":"askari","key":"ref8"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/3292500.3330936"},{"key":"ref2","first-page":"1","article-title":"Learning representations by back-propagating errors","volume":"5","author":"rumelhart","year":"1988","journal-title":"Cognitive Modeling"},{"key":"ref9","first-page":"24","article-title":"Beyond back-prop: Alternating minimization with co-activation memory","volume":"1050","author":"choromanska","year":"2018","journal-title":"Stat"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1214\/aoms\/1177729586"},{"article-title":"Momentum and stochastic momentum for stochastic gradient, newton, proximal point and subspace descent methods","year":"2017","author":"loizou","key":"ref20"},{"key":"ref22","article-title":"Heavyball algorithms always escape saddle points","author":"sun","year":"2019","journal-title":"IJCAI"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ALLERTON.2018.8636082"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1016\/j.ins.2019.06.024"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1137\/080724265"},{"article-title":"Fashion-mnist: a novel image dataset for benchmarking machine learning algorithms","year":"2017","author":"xiao","key":"ref26"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/5.726791"}],"event":{"name":"ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","start":{"date-parts":[[2021,6,6]]},"location":"Toronto, ON, Canada","end":{"date-parts":[[2021,6,11]]}},"container-title":["ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9413349\/9413350\/09413500.pdf?arnumber=9413500","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T15:41:03Z","timestamp":1652197263000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9413500\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,6,6]]},"references-count":29,"URL":"https:\/\/doi.org\/10.1109\/icassp39728.2021.9413500","relation":{},"subject":[],"published":{"date-parts":[[2021,6,6]]}}}