{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,14]],"date-time":"2026-02-14T03:02:20Z","timestamp":1771038140423,"version":"3.50.1"},"reference-count":42,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2022,4,30]],"date-time":"2022-04-30T00:00:00Z","timestamp":1651276800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,4,30]],"date-time":"2022-04-30T00:00:00Z","timestamp":1651276800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"the Strategic Cooperation Technology Projects of CNPC and CUPB","award":["ZLZX2020-03"],"award-info":[{"award-number":["ZLZX2020-03"]}]},{"name":"the National Key Research and Development Project","award":["2019YFA0708304"],"award-info":[{"award-number":["2019YFA0708304"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Appl Intell"],"published-print":{"date-parts":[[2023,1]]},"DOI":"10.1007\/s10489-022-03515-2","type":"journal-article","created":{"date-parts":[[2022,5,2]],"date-time":"2022-05-02T18:02:42Z","timestamp":1651514562000},"page":"1619-1639","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":13,"title":["A novel second-order learning algorithm based attention-LSTM model for dynamic chemical process modeling"],"prefix":"10.1007","volume":"53","author":[{"given":"Baochang","family":"Xu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7168-5399","authenticated-orcid":false,"given":"Yaxin","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Likun","family":"Yuan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Chaonong","family":"Xu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2022,4,30]]},"reference":[{"key":"3515_CR1","volume-title":"Processing identification","author":"CZ Fang","year":"1988","unstructured":"Fang CZ, Xiao DY (1988) Processing identification. Tsinghua University Press, Beijing"},{"key":"3515_CR2","doi-asserted-by":"publisher","first-page":"19","DOI":"10.1016\/j.compchemeng.2013.03.029","volume":"55","author":"YAW Shardt","year":"2013","unstructured":"Shardt YAW, Huang B (2013) Data quality assessment of routine operating data for process identification. Comput Chem Eng 55:19\u201327. https:\/\/doi.org\/10.1016\/j.compchemeng.2013.03.029","journal-title":"Comput Chem Eng"},{"key":"3515_CR3","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter S, Schmidhuber J (1997) Long short-term memory. Neural Comput 9:1735\u20131780. https:\/\/doi.org\/10.1162\/neco.1997.9.8.1735","journal-title":"Neural Comput"},{"key":"3515_CR4","doi-asserted-by":"crossref","unstructured":"Ke WS, Huang DX, Yang F, Jiang YH (2017) Soft sensor development and applications based on LSTM in deep neural networks. In: IEEE symposium series on computational intelligence (SSCI), pp 1\u20136","DOI":"10.1109\/SSCI.2017.8280954"},{"key":"3515_CR5","doi-asserted-by":"publisher","first-page":"64","DOI":"10.1016\/j.neucom.2019.08.006","volume":"367","author":"X Zhang","year":"2019","unstructured":"Zhang X, Zou YY, Li SY, Xu SH (2019) A weighted auto regressive LSTM based approach for chemical processes modeling. Neurocomputing 367:64\u201374. https:\/\/doi.org\/10.1016\/j.neucom.2019.08.006","journal-title":"Neurocomputing"},{"key":"3515_CR6","doi-asserted-by":"publisher","unstructured":"Wang Y (2017) A new concept using LSTM neural networks for dynamic system identification. In: American control conference (ACC) pp 5324\u20135329. https:\/\/doi.org\/10.23919\/ACC.2017.7963782","DOI":"10.23919\/ACC.2017.7963782"},{"key":"3515_CR7","doi-asserted-by":"publisher","first-page":"2700","DOI":"10.1109\/TII.2018.2869899","volume":"15","author":"Q Sun","year":"2019","unstructured":"Sun Q, Ge Z (2019) Probabilistic sequential network for deep learning of complex process data and soft sensor application. IEEE Trans Ind Inform 15:2700\u20132709. https:\/\/doi.org\/10.1109\/TII.2018.2869899","journal-title":"IEEE Trans Ind Inform"},{"key":"3515_CR8","doi-asserted-by":"publisher","first-page":"7233","DOI":"10.1109\/TII.2018.2880968","volume":"16","author":"K Wang","year":"2018","unstructured":"Wang K, Gopaluni B, Chen J, Song Z (2018) Deep learning of complex batch process data and its application on quality prediction. IEEE Trans Ind Inform 16:7233\u20137242. https:\/\/doi.org\/10.1109\/TII.2018.2880968","journal-title":"IEEE Trans Ind Inform"},{"key":"3515_CR9","doi-asserted-by":"publisher","first-page":"1669","DOI":"10.1007\/s10489-020-01890-2","volume":"51","author":"BR Preeti","year":"2021","unstructured":"Preeti BR, Dagar A, Singh RP (2021) A novel online sequential extreme learning machine with L2,1-norm regularization for prediction problems. Appl Intell 51:1669\u20131689. https:\/\/doi.org\/10.1007\/s10489-020-01890-2","journal-title":"Appl Intell"},{"key":"3515_CR10","doi-asserted-by":"publisher","first-page":"887","DOI":"10.1007\/s11222-020-09924-y","volume":"30","author":"LF Ye","year":"2020","unstructured":"Ye LF, Beskos A, Iorio MD, Hao J (2020) Monte Carlo co-ordinate ascent variational inference. Stat Comput 30:887\u2013905. https:\/\/doi.org\/10.1007\/s11222-020-09924-y","journal-title":"Stat Comput"},{"key":"3515_CR11","doi-asserted-by":"publisher","first-page":"223","DOI":"10.1137\/16M1080173","volume":"60","author":"L Bottou","year":"2016","unstructured":"Bottou L, Curtis FE, Nocedal J (2016) Optimization methods for large-scale machine learning. SIAM Rev 60:223\u2013311. https:\/\/doi.org\/10.1137\/16M1080173","journal-title":"SIAM Rev"},{"key":"3515_CR12","doi-asserted-by":"publisher","first-page":"621","DOI":"10.1007\/s12190-019-01300-y","volume":"62","author":"P Zhang","year":"2020","unstructured":"Zhang P (2020) A regularization Newton method based on the generalized Fischer\u2013Burmeister smoothing function for the NCP. J Appl Math Comput 62:621\u2013635. https:\/\/doi.org\/10.1007\/s12190-019-01300-y","journal-title":"J Appl Math Comput"},{"key":"3515_CR13","doi-asserted-by":"publisher","unstructured":"An AM, Han KJ, Zhu L, Chen L, Liang R (2017) Networked distributed model predictive control for multi-variable coupling process. In: eighth international conference on intelligent control and information processing (ICICIP) pp 272\u2013277. https:\/\/doi.org\/10.1109\/ICICIP.2017.8113954","DOI":"10.1109\/ICICIP.2017.8113954"},{"key":"3515_CR14","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.sysconle.2019.104601","volume":"136","author":"H Komatsua","year":"2020","unstructured":"Komatsua H, Nakajimab H (2020) The deficiency zero theorem and global asymptotic stability for a class of chemical reaction networks with arbitrary time delays. Syst Control Lett 136:1\u201310. https:\/\/doi.org\/10.1016\/j.sysconle.2019.104601","journal-title":"Syst Control Lett"},{"key":"3515_CR15","doi-asserted-by":"publisher","first-page":"348","DOI":"10.1016\/j.neucom.2020.04.110","volume":"403","author":"YK Ding","year":"2020","unstructured":"Ding YK, Zhu YL, Feng J, Zhang PC, Cheng ZR (2020) Interpretable spatio-temporal attention LSTM model for flood forecasting. Neurocomputing 403:348\u2013359. https:\/\/doi.org\/10.1016\/j.neucom.2020.04.110","journal-title":"Neurocomputing"},{"key":"3515_CR16","doi-asserted-by":"publisher","first-page":"148","DOI":"10.1109\/TNNLS.2019.2899936","volume":"31","author":"SM Yang","year":"2019","unstructured":"Yang SM, Deng B, Wang J, Li H, Lu M, Che Y, Wei X, Loparo KA (2019) Scalable digital neuromorphic architecture for large-scale biophysically meaningful neural network with multi-compartment neurons. IEEE Trans Neural Netw Learn Syst 31:148\u2013162. https:\/\/doi.org\/10.1109\/TNNLS.2019.2899936","journal-title":"IEEE Trans Neural Netw Learn Syst"},{"key":"3515_CR17","doi-asserted-by":"publisher","unstructured":"Yang SM, Wang J, Zhang N et al (2021) CerebelluMorphic: large-scale neuromorphic model and architecture for supervised motor learning. IEEE Trans Neural Netw Learn Syst:1\u201315. https:\/\/doi.org\/10.1109\/TNNLS.2021.3057070","DOI":"10.1109\/TNNLS.2021.3057070"},{"key":"3515_CR18","doi-asserted-by":"publisher","first-page":"601109","DOI":"10.3389\/fnins.2021.601109","volume":"15","author":"SM Yang","year":"2021","unstructured":"Yang SM, Gao T, Wang J, Deng B, Lansdell B, Linares-Barranco B (2021) Efficient spike-driven learning with dendritic event-based processing. Front Neurosci 15:601109. https:\/\/doi.org\/10.3389\/fnins.2021.601109","journal-title":"Front Neurosci"},{"key":"3515_CR19","doi-asserted-by":"publisher","unstructured":"Yang SM, Wang J, Deng B, Azghadi MR, Linares-Barranco B (2021) Neuromorphic context-dependent learning framework with fault-tolerant spike routing. IEEE Trans Neural Netw Learn Syst:1\u201315. https:\/\/doi.org\/10.1109\/TNNLS.2021.3084250","DOI":"10.1109\/TNNLS.2021.3084250"},{"key":"3515_CR20","doi-asserted-by":"publisher","unstructured":"Wilfred KJN, Sreeraj S, Vijay B, Bagyaveereswaran V (2015) System identification using artificial neural network. In: International conference on circuits, power and computing technologies (ICCPCT), pp 1\u20134. https:\/\/doi.org\/10.1109\/ICCPCT.2015.7159360","DOI":"10.1109\/ICCPCT.2015.7159360"},{"key":"3515_CR21","doi-asserted-by":"publisher","first-page":"2212","DOI":"10.1007\/s10489-021-02442-y","volume":"52","author":"Y Yang","year":"2021","unstructured":"Yang Y, Fan CJ, Xiong HL (2021) A novel general-purpose hybrid model for time series forecasting. Appl Intell 52:2212\u20132223. https:\/\/doi.org\/10.1007\/s10489-021-02442-y","journal-title":"Appl Intell"},{"key":"3515_CR22","doi-asserted-by":"publisher","first-page":"114072","DOI":"10.1016\/j.applthermaleng.2019.114072","volume":"160","author":"YM Han","year":"2019","unstructured":"Han YM, Fan CY, Xu M, Geng ZQ, Zhong YH (2019) Production capacity analysis and energy saving of complex chemical processes using LSTM based on attention mechanism. Appl Therm Eng 160:114072. https:\/\/doi.org\/10.1016\/j.applthermaleng.2019.114072","journal-title":"Appl Therm Eng"},{"key":"3515_CR23","doi-asserted-by":"publisher","first-page":"185","DOI":"10.1016\/0925-2312(93)90006-O","volume":"5","author":"S Amari","year":"1993","unstructured":"Amari S (1993) Backpropagation and stochastic gradient descent method. Neurocomputing 5:185\u2013196. https:\/\/doi.org\/10.1016\/0925-2312(93)90006-O","journal-title":"Neurocomputing"},{"key":"3515_CR24","doi-asserted-by":"publisher","unstructured":"Senior A, Heigold G, Ranzato M, Yang K (2013) An empirical study of learning rates in deep neural networks for speech recognition. In: IEEE international conference on acoustics, speech and signal processing (ICASSP), pp 6724\u20136728. https:\/\/doi.org\/10.1109\/ICASSP.2013.6638963","DOI":"10.1109\/ICASSP.2013.6638963"},{"key":"3515_CR25","doi-asserted-by":"publisher","first-page":"74","DOI":"10.1016\/j.neucom.2015.12.076","volume":"186","author":"SS Liew","year":"2016","unstructured":"Liew SS, Khalil-Hani M, Bakhteri R (2016) An optimized second order stochastic learning algorithm for neural network training. Neurocomputing 186:74\u201389. https:\/\/doi.org\/10.1016\/j.neucom.2015.12.076","journal-title":"Neurocomputing"},{"key":"3515_CR26","doi-asserted-by":"publisher","unstructured":"Hadgu AT, Nigam A, Diaz-Aviles E (2015) Large-scale learning with AdaGrad on spark. In: IEEE International Conference on Big Data, pp 2828\u20132830. https:\/\/doi.org\/10.1109\/BigData.2015.7364091","DOI":"10.1109\/BigData.2015.7364091"},{"key":"3515_CR27","unstructured":"Zeiler MD (2012) ADADELTA: an adaptive learning rate method arXiv: 1212.5701"},{"key":"3515_CR28","doi-asserted-by":"publisher","first-page":"253","DOI":"10.1016\/j.neucom.2004.11.016","volume":"64","author":"AD Anastasiadisa","year":"2005","unstructured":"Anastasiadisa AD, Magoulasa GD, Vrahatis MN (2005) New globally convergent training scheme based on the resilient propagation algorithm. Neurocomputing 64:253\u2013270. https:\/\/doi.org\/10.1016\/j.neucom.2004.11.016","journal-title":"Neurocomputing"},{"key":"3515_CR29","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1007\/s10107-012-0514-2","volume":"141","author":"AS Lewis","year":"2013","unstructured":"Lewis AS, Overton ML (2013) Nonsmooth optimization via quasi-Newton methods. Math Program 141:135\u2013163. https:\/\/doi.org\/10.1007\/s10107-012-0514-2","journal-title":"Math Program"},{"key":"3515_CR30","doi-asserted-by":"publisher","first-page":"15","DOI":"10.1016\/S0377-0427(00)00540-9","volume":"129","author":"DH Li","year":"2001","unstructured":"Li DH, Fukushima M (2001) A modified BFGS method and its global convergence in nonconvex minimization. J Comput Appl Math 129:15\u201335","journal-title":"J Comput Appl Math"},{"key":"3515_CR31","doi-asserted-by":"publisher","first-page":"6669","DOI":"10.1007\/s00521-019-04689-6","volume":"32","author":"IE Livieris","year":"2020","unstructured":"Livieris IE (2020) An advanced active set L-BFGS algorithm for training weight-constrained neural networks. Neural Comput Appl 32:6669\u20136684. https:\/\/doi.org\/10.1007\/s00521-019-04689-6","journal-title":"Neural Comput Appl"},{"key":"3515_CR32","unstructured":"Zhang YM, Bai SL (2011) A novel adaptive filter algorithm based on DFP technique. In: Proceedings of the 30th Chinese control conference (CCC), pp 1688\u20131691"},{"key":"3515_CR33","doi-asserted-by":"publisher","first-page":"106","DOI":"10.1137\/050624935","volume":"18","author":"S Gratton","year":"2007","unstructured":"Gratton S, Lawless AS, Nichols NK (2007) Approximate gauss\u2013Newton methods for nonlinear least squares problems. SIAM J Optim 18:106\u2013132. https:\/\/doi.org\/10.1137\/050624935","journal-title":"SIAM J Optim"},{"key":"3515_CR34","doi-asserted-by":"publisher","first-page":"1237","DOI":"10.1007\/s00521-017-3156-8","volume":"31","author":"MJ Rana","year":"2019","unstructured":"Rana MJ, Shahriar MS, Shafiullah M (2019) Levenberg\u2013Marquardt neural network to estimate UPFC-coordinated PSS parameters to enhance power system stability. Neural Comput Appl 31:1237\u20131248. https:\/\/doi.org\/10.1007\/s00521-017-3156-8","journal-title":"Neural Comput Appl"},{"key":"3515_CR35","unstructured":"Gupta V, Koren T, Singer Y (2018) Shampoo: preconditioned stochastic tensor optimization. arXiv: 1802.09568v2"},{"key":"3515_CR36","doi-asserted-by":"publisher","first-page":"545","DOI":"10.1093\/imanum\/dry009","volume":"39","author":"R Bollapragada","year":"2016","unstructured":"Bollapragada R, Byrd RH, Nocedal J (2016) Exact and inexact subsampled Newton methods for optimization. IMA J Numer Anal 39:545\u2013578. https:\/\/doi.org\/10.1093\/imanum\/dry009","journal-title":"IMA J Numer Anal"},{"key":"3515_CR37","first-page":"1","volume":"18","author":"N Agarwal","year":"2017","unstructured":"Agarwal N, Bullins B, Hazan E (2017) Second-order stochastic optimization for machine learning in linear time. J Mach Learn Res 18:1\u201340","journal-title":"J Mach Learn Res"},{"key":"3515_CR38","doi-asserted-by":"publisher","unstructured":"Li C, Zhang X, Qaosar M, Ahmed S, Alam KMR, Morimoto Y (2019) Multi-factor based stock Price prediction using hybrid neural networks with attention mechanism. In: IEEE Intl Conf on dependable, autonomic and secure computing (DASC), pp 961\u2013966. https:\/\/doi.org\/10.1109\/DASC\/PiCom\/CBDCom\/CyberSciTech.2019.00176","DOI":"10.1109\/DASC\/PiCom\/CBDCom\/CyberSciTech.2019.00176"},{"key":"3515_CR39","doi-asserted-by":"publisher","first-page":"4381","DOI":"10.1007\/s10489-020-02143-y","volume":"51","author":"XY He","year":"2021","unstructured":"He XY, Shi SX, Geng XL, Xu LY, Zhang XL (2021) Spatial-temporal attention network for multistep-ahead forecasting of chlorophyll. Appl Intell 51:4381\u20134393. https:\/\/doi.org\/10.1007\/s10489-020-02143-y","journal-title":"Appl Intell"},{"key":"3515_CR40","doi-asserted-by":"publisher","first-page":"7915","DOI":"10.1007\/s00521-019-04301-x","volume":"32","author":"MY Chen","year":"2020","unstructured":"Chen MY, Chiang HS, Sangaiah AK, Hsieh TC (2020) Recurrent neural network with attention mechanism for language model. Neural Comput Appl 32:7915\u20137923. https:\/\/doi.org\/10.1007\/s00521-019-04301-x","journal-title":"Neural Comput Appl"},{"key":"3515_CR41","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1007\/s10489-018-1206-2","volume":"49","author":"X Wu","year":"2019","unstructured":"Wu X, Du ZK, Guo YK, Fujita H (2019) Hierarchical attention based long short-term memory for Chinese lyric generation. Appl Intell 49:44\u201352. https:\/\/doi.org\/10.1007\/s10489-018-1206-2","journal-title":"Appl Intell"},{"key":"3515_CR42","doi-asserted-by":"publisher","first-page":"106508","DOI":"10.1016\/j.knosys.2020.106508","volume":"211","author":"JC Li","year":"2021","unstructured":"Li JC, Yang B, Li HG, Wang YJ, Qi C, Liu Y (2021) DTDR\u2013ALSTM: extracting dynamic time-delays to reconstruct multivariate data for improving attention-based LSTM industrial time series prediction models. Knowl Based Syst 211:106508. https:\/\/doi.org\/10.1016\/j.knosys.2020.106508","journal-title":"Knowl Based Syst"}],"container-title":["Applied Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-022-03515-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10489-022-03515-2\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10489-022-03515-2.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,4]],"date-time":"2023-01-04T04:45:19Z","timestamp":1672807519000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10489-022-03515-2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,4,30]]},"references-count":42,"journal-issue":{"issue":"2","published-print":{"date-parts":[[2023,1]]}},"alternative-id":["3515"],"URL":"https:\/\/doi.org\/10.1007\/s10489-022-03515-2","relation":{},"ISSN":["0924-669X","1573-7497"],"issn-type":[{"value":"0924-669X","type":"print"},{"value":"1573-7497","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,4,30]]},"assertion":[{"value":"15 March 2022","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 April 2022","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"We declare that we have no potential competing interests in our paper. All authors have seen the manuscript and approved to submit to your journal. We confirm that the content of the manuscript has not been published or submitted for publication elsewhere.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}