{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,31]],"date-time":"2025-12-31T12:11:50Z","timestamp":1767183110250,"version":"3.28.0"},"reference-count":31,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,1,8]],"date-time":"2024-01-08T00:00:00Z","timestamp":1704672000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,1,8]],"date-time":"2024-01-08T00:00:00Z","timestamp":1704672000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,1,8]]},"DOI":"10.1109\/ccwc60891.2024.10427781","type":"proceedings-article","created":{"date-parts":[[2024,2,13]],"date-time":"2024-02-13T23:35:29Z","timestamp":1707867329000},"page":"0414-0420","source":"Crossref","is-referenced-by-count":3,"title":["Multiple Gain Adaptations for Improved Neural Networks Training"],"prefix":"10.1109","author":[{"given":"Jeshwanth","family":"Challagundla","sequence":"first","affiliation":[{"name":"The University of Texas at Arlington,Department of Electrical Engineering,Arlington,Texas"}]},{"given":"Kanishka","family":"Tyagi","sequence":"additional","affiliation":[{"name":"The University of Texas at Arlington,Department of Electrical Engineering,Arlington,Texas"}]},{"given":"Tushar","family":"Chugh","sequence":"additional","affiliation":[{"name":"Carnegie Mellon University,School of Computer Science,Pittsburgh,USA"}]},{"given":"Michael","family":"Manry","sequence":"additional","affiliation":[{"name":"The University of Texas at Arlington,Department of Electrical Engineering,Arlington,Texas"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/0893-6080(89)90020-8"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/72.80266"},{"article-title":"Adam: A method for stochastic optimization","year":"2014","author":"Kingma","key":"ref3"},{"article-title":"Adadelta: An adaptive learning rate method","year":"2012","author":"Zeiler","key":"ref4"},{"key":"ref5","first-page":"2121","article-title":"Adaptive subgradient methods for online learning and stochastic optimization","volume":"12","author":"Duchi","year":"2011","journal-title":"Journal of Machine Learning Research"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2017.7966082"},{"volume-title":"Pattern classification.","year":"2012","author":"Duda","key":"ref7"},{"key":"ref8","first-page":"4596","article-title":"Adafactor: Adaptive learning rates with sublinear memory cost","volume-title":"International Conference on Machine Learning","author":"Shazeer"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-19-5443-6_21"},{"article-title":"Large batch optimization for deep learning: Training bert in 76 minutes","year":"2019","author":"You","key":"ref10"},{"article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","year":"2018","author":"Devlin","key":"ref11"},{"key":"ref12","first-page":"38801","article-title":"Slamb: accelerated large batch training with sparse communication","volume-title":"International Conference on Machine Learning","author":"Xu"},{"article-title":"Symbolic discovery of optimization algorithms","year":"2023","author":"Chen","key":"ref13"},{"key":"ref14","first-page":"1842","article-title":"Shampoo: Preconditioned stochastic tensor optimization","volume-title":"International Conference on Machine Learning","author":"Gupta"},{"article-title":"Scalable second order optimization for deep learning","year":"2020","author":"Anil","key":"ref15"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i12.17275"},{"issue":"1","key":"ref17","first-page":"30","article-title":"Adaptive multiple optimal learning factors for neural network training","volume-title":"M.S. Thesis\/Dissertation","volume":"1","author":"Challagundla","year":"2015"},{"key":"ref18","article-title":"Pattern recognition","volume":"128","author":"Bishop","year":"2006","journal-title":"Machine Learning"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/1273496.1273556"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1016\/B978-0-12-824054-0.00004-6"},{"article-title":"Two-stage second order training in feedforward neural networks","volume-title":"FLAIRS Conference","author":"Robinson","key":"ref21"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/s11063-019-10116-7"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2013.6706919"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.6028\/jres.049.044"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1049\/ip-g-2.1992.0050"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1090\/qam\/10666"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1016\/0893-6080(88)90003-2"},{"key":"ref28","volume-title":"Neural networks and learning machines","volume":"3","author":"Haykin","year":"2009"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2011.6033557"},{"article-title":"Classification data files","volume-title":"Image Processing and Neural Networks Lab, The University of Texas Arlington","year":"2022","key":"ref30"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2014.08.043"}],"event":{"name":"2024 IEEE 14th Annual Computing and Communication Workshop and Conference (CCWC)","start":{"date-parts":[[2024,1,8]]},"location":"Las Vegas, NV, USA","end":{"date-parts":[[2024,1,10]]}},"container-title":["2024 IEEE 14th Annual Computing and Communication Workshop and Conference (CCWC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10426790\/10427556\/10427781.pdf?arnumber=10427781","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,3]],"date-time":"2024-03-03T14:38:40Z","timestamp":1709476720000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10427781\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,1,8]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/ccwc60891.2024.10427781","relation":{},"subject":[],"published":{"date-parts":[[2024,1,8]]}}}