{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,8]],"date-time":"2026-06-08T13:58:46Z","timestamp":1780927126384,"version":"3.54.1"},"reference-count":62,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"11","license":[{"start":{"date-parts":[[2020,11,1]],"date-time":"2020-11-01T00:00:00Z","timestamp":1604188800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,11,1]],"date-time":"2020-11-01T00:00:00Z","timestamp":1604188800000},"content-version":"am","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,11,1]],"date-time":"2020-11-01T00:00:00Z","timestamp":1604188800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,11,1]],"date-time":"2020-11-01T00:00:00Z","timestamp":1604188800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["CCF-2007668"],"award-info":[{"award-number":["CCF-2007668"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]},{"name":"NSF HDR TRIPODS","award":["#1934960"],"award-info":[{"award-number":["#1934960"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Proc. IEEE"],"published-print":{"date-parts":[[2020,11]]},"DOI":"10.1109\/jproc.2020.3023660","type":"journal-article","created":{"date-parts":[[2020,9,29]],"date-time":"2020-09-29T22:27:36Z","timestamp":1601418456000},"page":"1906-1922","source":"Crossref","is-referenced-by-count":30,"title":["Stochastic Quasi-Newton Methods"],"prefix":"10.1109","volume":"108","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6603-0091","authenticated-orcid":false,"given":"Aryan","family":"Mokhtari","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4230-9906","authenticated-orcid":false,"given":"Alejandro","family":"Ribeiro","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1093\/imanum\/11.3.325"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/BF00962795"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1093\/imamat\/7.1.21"},{"key":"ref32","doi-asserted-by":"crossref","first-page":"523","DOI":"10.2307\/2005323","article-title":"On the global convergence of Broyde&#x2019;s method","volume":"30","author":"mor\u00e9","year":"1976","journal-title":"Math Comput"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1007\/BF01589116"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.2307\/2006193"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/BF01407874"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1080\/10556788.2018.1510927"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1137\/0724077"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1090\/S0025-5718-1974-0343581-1"},{"key":"ref60","first-page":"1447","article-title":"Large scale empirical risk minimization via truncated adaptive Newton method","author":"eisen","year":"2018","journal-title":"Proc Int Conf Artif Intell Statist"},{"key":"ref62","article-title":"Non-asymptotic superlinear convergence of standard quasi-Newton methods","author":"jin","year":"2020","journal-title":"arXiv 2003 13607"},{"key":"ref61","article-title":"Rates of superlinear convergence for classical quasi-Newton methods","author":"rodomanov","year":"2020","journal-title":"arXiv 2003 09174"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1137\/0801001"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1137\/0716047"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1093\/comjnl\/6.2.163"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1093\/comjnl\/13.3.317"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.2307\/2004483"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-7908-2604-3_16"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/1015330.1015332"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/s10107-010-0420-4"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/BF01594934"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1137\/070704277"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1093\/imamat\/12.3.223"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1090\/S0025-5718-1965-0198670-6"},{"key":"ref50","first-page":"1055","article-title":"A multi-batch L-BFGS method for machine learning","author":"berahas","year":"2016","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref51","first-page":"1965","article-title":"DAve-QN: A distributed averaged quasi-Newton method with local superlinear convergence rate","author":"soori","year":"2020","journal-title":"Proc Int Conf Artif Intell Statist"},{"key":"ref59","first-page":"2060","article-title":"First-order adaptive sample size methods to reduce complexity of empirical risk minimization","author":"mokhtari","year":"2017","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref58","first-page":"4062","article-title":"Adaptive Newton method for empirical risk minimization to statistical accuracy","author":"mokhtari","year":"2016","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1137\/S1052623499354242"},{"key":"ref56","author":"sun","year":"2012","journal-title":"KDD Cup Track 2 soso com ADS Prediction Challenge"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1137\/0330046"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1080\/10556788.2018.1471141"},{"key":"ref53","article-title":"Quasi-Newton methods for deep learning: Forget the past, just sample","author":"berahas","year":"2019","journal-title":"arXiv 1901 09997"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1137\/15M1053141"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1007\/s10107-016-1030-6"},{"key":"ref11","first-page":"1646","article-title":"SAGA: A fast incremental gradient method with support for non-strongly convex composite objectives","author":"defazio","year":"2014","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1016\/S0167-6377(97)00012-6"},{"key":"ref12","first-page":"315","article-title":"Accelerating stochastic gradient descent using predictive variance reduction","author":"johnson","year":"2013","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1137\/040615961"},{"key":"ref14","first-page":"3","article-title":"Semi-stochastic gradient descent methods","volume":"2","author":"konecn?","year":"2013","journal-title":"arXiv 1312 1666"},{"key":"ref15","first-page":"980","article-title":"Linear convergence with condition number independent access of full gradients","author":"zhang","year":"2013","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1137\/15M1049695"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1137\/16M1101702"},{"key":"ref18","first-page":"249","article-title":"A linearly-convergent stochastic L-BFGS algorithm","author":"moritz","year":"2016","journal-title":"Proc Int Conf Artif Intell Statist (AISTATS)"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1137\/17M1122943"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1090\/S0025-5718-1970-0274029-X"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1090\/S0025-5718-1970-0258249-6"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/TSP.2014.2357775"},{"key":"ref5","first-page":"1737","article-title":"SGD-QN: Careful quasi-Newton stochastic gradient descent","volume":"10","author":"bordes","year":"2009","journal-title":"J Mach Learn Res"},{"key":"ref8","first-page":"3151","article-title":"Global convergence of online limited memory BFGS","volume":"16","author":"mokhtari","year":"2015","journal-title":"J Mach Learn Res"},{"key":"ref7","first-page":"436","article-title":"A stochastic quasi-Newton method for online convex optimization","author":"schraudolph","year":"2007","journal-title":"Proc Int Conf Artif Intell Statist (AISTATS)"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2018.8619209"},{"key":"ref9","first-page":"2663","article-title":"A stochastic gradient method with an exponential convergence rate for finite training sets","author":"le roux","year":"2012","journal-title":"Proc Adv Neural Inf Process Syst"},{"key":"ref46","article-title":"A variance reduced stochastic Newton method","author":"lucchi","year":"2015","journal-title":"arXiv 1503 08316"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1137\/140954362"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CDC.2016.7798953"},{"key":"ref47","first-page":"1869","article-title":"Stochastic block BFGS: Squeezing more curvature out of data","author":"gower","year":"2016","journal-title":"Proc Int Conf Mach Learn"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1137\/S0036142998335704"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1023\/A:1018315205474"},{"key":"ref44","author":"nocedal","year":"2006","journal-title":"Numerical Optimization"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1016\/j.cam.2006.05.018"}],"container-title":["Proceedings of the IEEE"],"original-title":[],"link":[{"URL":"https:\/\/ieeexplore.ieee.org\/ielam\/5\/9241485\/9207765-aam.pdf","content-type":"application\/pdf","content-version":"am","intended-application":"syndication"},{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/5\/9241485\/09207765.pdf?arnumber=9207765","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,4,27]],"date-time":"2022-04-27T13:39:53Z","timestamp":1651066793000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9207765\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,11]]},"references-count":62,"journal-issue":{"issue":"11"},"URL":"https:\/\/doi.org\/10.1109\/jproc.2020.3023660","relation":{},"ISSN":["0018-9219","1558-2256"],"issn-type":[{"value":"0018-9219","type":"print"},{"value":"1558-2256","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,11]]}}}