{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,13]],"date-time":"2026-01-13T05:23:11Z","timestamp":1768281791082,"version":"3.49.0"},"reference-count":50,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,7,1]],"date-time":"2024-07-01T00:00:00Z","timestamp":1719792000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Applied Soft Computing"],"published-print":{"date-parts":[[2024,7]]},"DOI":"10.1016\/j.asoc.2024.111705","type":"journal-article","created":{"date-parts":[[2024,5,7]],"date-time":"2024-05-07T16:35:59Z","timestamp":1715099759000},"page":"111705","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":7,"special_numbering":"C","title":["Sparsify dynamically expandable network via variational dropout"],"prefix":"10.1016","volume":"160","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8851-1790","authenticated-orcid":false,"given":"Yang","family":"Yang","sequence":"first","affiliation":[]},{"given":"Jie","family":"Huang","sequence":"additional","affiliation":[]},{"given":"Dexiu","family":"Hu","sequence":"additional","affiliation":[]}],"member":"78","reference":[{"issue":"4","key":"10.1016\/j.asoc.2024.111705_b1","doi-asserted-by":"crossref","first-page":"391","DOI":"10.1007\/s11023-007-9079-x","article-title":"Universal intelligence: A definition of machine intelligence","volume":"17","author":"Legg","year":"2007","journal-title":"Minds Mach."},{"key":"10.1016\/j.asoc.2024.111705_b2","first-page":"23","article-title":"A lifelong learning perspective for mobile robot control","author":"Thrun","year":"1995","journal-title":"Intell. Robot. Syst."},{"issue":"4","key":"10.1016\/j.asoc.2024.111705_b3","doi-asserted-by":"crossref","first-page":"128","DOI":"10.1016\/S1364-6613(99)01294-2","article-title":"Catastrophic forgetting in connectionist networks","volume":"3","author":"French","year":"1999","journal-title":"Trends in Cognitive Sciences"},{"key":"10.1016\/j.asoc.2024.111705_b4","doi-asserted-by":"crossref","first-page":"109","DOI":"10.1016\/S0079-7421(08)60536-8","article-title":"Catastrophic interference in connectionist networks: The sequential learning problem","volume":"24","author":"McCloskey","year":"1989","journal-title":"Psychol. Learn. Motiv."},{"issue":"7","key":"10.1016\/j.asoc.2024.111705_b5","doi-asserted-by":"crossref","first-page":"512","DOI":"10.1016\/j.tics.2016.05.004","article-title":"What learning systems do intelligent agents need? Complementary learning systems theory updated","volume":"20","author":"Kumaran","year":"2016","journal-title":"Trends in Cognitive Sciences"},{"issue":"13","key":"10.1016\/j.asoc.2024.111705_b6","doi-asserted-by":"crossref","first-page":"3521","DOI":"10.1073\/pnas.1611835114","article-title":"Overcoming catastrophic forgetting in neural networks","volume":"114","author":"Kirkpatrick","year":"2017","journal-title":"Proc. Natl. Acad. Sci."},{"key":"10.1016\/j.asoc.2024.111705_b7","first-page":"3987","article-title":"Continual learning through synaptic intelligence","volume":"vol. 70","author":"Zenke","year":"2017"},{"key":"10.1016\/j.asoc.2024.111705_b8","unstructured":"C. Nguyen, Y. Li, T. Bui, R. Turner, Variational Continual Learning, in: International Conference on Learning Representations, 2018."},{"key":"10.1016\/j.asoc.2024.111705_b9","unstructured":"E. Sayna, E. Mohamed, D. Trevor, R. Marcus, Uncertainty-guided Continual Learning with Bayesian Neural Networks, in: International Conference on Learning Representations, 2020."},{"key":"10.1016\/j.asoc.2024.111705_b10","series-title":"Advances in Neural Information Processing Systems","first-page":"26622","article-title":"Joint inference for neural network depth and dropout regularization","author":"Kishan","year":"2021"},{"key":"10.1016\/j.asoc.2024.111705_b11","doi-asserted-by":"crossref","unstructured":"V. Araujo, J. Hurtado, A. Soto, M.-F. Moens, Entropy-based Stability-Plasticity for Lifelong Learning, in: IEEE Conference on Computer Vision and Pattern Recognition Workshops, 2022, pp. 3720\u20133727.","DOI":"10.1109\/CVPRW56347.2022.00416"},{"key":"10.1016\/j.asoc.2024.111705_b12","first-page":"163","article-title":"Anti-retroactive interference for lifelong learning","volume":"vol. 13684","author":"Wang","year":"2022"},{"key":"10.1016\/j.asoc.2024.111705_b13","doi-asserted-by":"crossref","unstructured":"S. Kim, L. Noci, A. Orvieto, T. Hofmann, Achieving a Better Stability-Plasticity Trade-off via Auxiliary Networks in Continual Learning, in: IEEE Conference on Computer Vision and Pattern Recognition, 2023, pp. 11930\u201311939.","DOI":"10.1109\/CVPR52729.2023.01148"},{"key":"10.1016\/j.asoc.2024.111705_b14","doi-asserted-by":"crossref","unstructured":"Q. Gao, C. Zhao, Y. Sun, T. Xi, G. Zhang, B. Ghanem, J. Zhang, A Unified Continual Learning Framework with General Parameter-Efficient Tuning, in: IEEE International Conference on Computer Vision, 2023, pp. 11449\u201311459.","DOI":"10.1109\/ICCV51070.2023.01055"},{"key":"10.1016\/j.asoc.2024.111705_b15","series-title":"Advances in Neural Information Processing Systems","first-page":"2990","article-title":"Continual learning with deep generative replay","author":"Hanul","year":"2017"},{"key":"10.1016\/j.asoc.2024.111705_b16","series-title":"Advances in Neural Information Processing Systems","first-page":"6467","article-title":"Gradient episodic memory for continual learning","author":"Lopez-Paz","year":"2017"},{"key":"10.1016\/j.asoc.2024.111705_b17","unstructured":"A. Chaudhry, M. Ranzato, M. Rohrbach, M. Elhoseiny, Efficient Lifelong Learning with A-GEM, in: International Conference on Learning Representations, 2019."},{"key":"10.1016\/j.asoc.2024.111705_b18","first-page":"6993","article-title":"Using hindsight to anchor past knowledge in continual learning","volume":"vol. 35","author":"Chaudhry","year":"2021"},{"key":"10.1016\/j.asoc.2024.111705_b19","unstructured":"G. Saha, I. Garg, K. Roy, Gradient Projection Memory for Continual Learning, in: International Conference on Learning Representations, 2021."},{"key":"10.1016\/j.asoc.2024.111705_b20","unstructured":"L. Caccia, R. Aljundi, N. Asadi, T. Tuytelaars, J. Pineau, E. Belilovsky, New Insights on Reducing Abrupt Representation Change in Online Continual Learning, in: International Conference on Learning Representations, 2022."},{"key":"10.1016\/j.asoc.2024.111705_b21","first-page":"9677","article-title":"Continual learning with scaled gradient projection","volume":"vol. 37","author":"Saha","year":"2023"},{"key":"10.1016\/j.asoc.2024.111705_b22","article-title":"Assessor-guided learning for continual environments","volume":"640","author":"Ma\u2019sum","year":"2023","journal-title":"Inform. Sci."},{"key":"10.1016\/j.asoc.2024.111705_b23","series-title":"Progressive neural networks","author":"Rusu","year":"2016"},{"key":"10.1016\/j.asoc.2024.111705_b24","unstructured":"J. Yoon, E. Yang, J. Lee, S. Hwang, Lifelong Learning with Dynamically Expandable Networks, in: International Conference on Learning Representations, 2018."},{"key":"10.1016\/j.asoc.2024.111705_b25","series-title":"Advances in Neural Information Processing Systems","first-page":"899","article-title":"Reinforced continual learning","author":"Xu","year":"2018"},{"key":"10.1016\/j.asoc.2024.111705_b26","doi-asserted-by":"crossref","unstructured":"S. Ebrahimi, F. Meier, R. Calandra, T. Darrell, M. Rohrbach, Adversarial Continual Learning, in: European Conference on Computer Vision, 2020, pp. 386\u2013402.","DOI":"10.1007\/978-3-030-58621-8_23"},{"key":"10.1016\/j.asoc.2024.111705_b27","first-page":"6065","article-title":"Sharing less is more: Lifelong learning in deep networks with selective layer transfer","volume":"vol. 139","author":"Lee","year":"2021"},{"key":"10.1016\/j.asoc.2024.111705_b28","first-page":"5867","article-title":"Lifelong neural predictive coding: Learning cumulatively online without forgetting","volume":"vol. 35","author":"Ororbia","year":"2022"},{"key":"10.1016\/j.asoc.2024.111705_b29","doi-asserted-by":"crossref","DOI":"10.1016\/j.patcog.2021.108260","article-title":"Bayesian compression for dynamically expandable networks","volume":"122","author":"Yang","year":"2022","journal-title":"Pattern Recognit."},{"key":"10.1016\/j.asoc.2024.111705_b30","doi-asserted-by":"crossref","first-page":"165","DOI":"10.1016\/j.neunet.2023.04.005","article-title":"Lifelong learning with shared and private latent representations learned through synaptic intelligence","volume":"163","author":"Yang","year":"2023","journal-title":"Neural Netw."},{"key":"10.1016\/j.asoc.2024.111705_b31","doi-asserted-by":"crossref","unstructured":"B. Han, F. Zhao, Y. Zeng, W. Pan, G. Shen, Enhancing Efficient Continual Learning with Dynamic Structure Development of Spiking Neural Networks, in: International Joint Conference on Artificial Intelligence, 2023, pp. 2993\u20133001.","DOI":"10.24963\/ijcai.2023\/334"},{"key":"10.1016\/j.asoc.2024.111705_b32","article-title":"Improving neural networks by preventing co-adaptation of feature detectors","author":"Hinton","year":"2012","journal-title":"Tech. Rep."},{"key":"10.1016\/j.asoc.2024.111705_b33","unstructured":"C. Zhang, S. Bengio, M. Hardt, B. Recht, O. Vinyals, Understanding deep learning requires rethinking generalization, in: International Conference on Learning Representations, 2017."},{"issue":"1","key":"10.1016\/j.asoc.2024.111705_b34","first-page":"1929","article-title":"Dropout: A simple way to prevent neural networks from overfitting","volume":"15","author":"Srivastava","year":"2014","journal-title":"J. Mach. Learn. Res."},{"key":"10.1016\/j.asoc.2024.111705_b35","unstructured":"Y. Gal, Z. Ghahramani, Dropout as a bayesian approximation: Insights and applications, in: Deep Learning Workshop in ICML, 2015."},{"key":"10.1016\/j.asoc.2024.111705_b36","first-page":"2498","article-title":"Variational dropout sparsifies deep neural networks","volume":"vol. 70","author":"Molchanov","year":"2017"},{"key":"10.1016\/j.asoc.2024.111705_b37","unstructured":"S. Han, H. Mao, W. Dally, Deep Compression: Compressing Deep Neural Networks with Pruning, Trained Quantization and Huffman Coding, in: International Conference on Learning Representations, 2016."},{"key":"10.1016\/j.asoc.2024.111705_b38","doi-asserted-by":"crossref","first-page":"81","DOI":"10.1016\/j.neucom.2017.02.029","article-title":"Group sparse regularization for deep neural networks","volume":"241","author":"Scardapane","year":"2017","journal-title":"Neurocomputing"},{"key":"10.1016\/j.asoc.2024.111705_b39","first-page":"211","article-title":"Sparse Bayesian learning and the relevance vector machine","volume":"1","author":"Tipping","year":"2001","journal-title":"J. Mach. Learn. Res."},{"issue":"1","key":"10.1016\/j.asoc.2024.111705_b40","first-page":"1303","article-title":"Stochastic variational inference","volume":"14","author":"Hoffman","year":"2013","journal-title":"J. Mach. Learn. Res."},{"key":"10.1016\/j.asoc.2024.111705_b41","unstructured":"D.P. Kingma, M. Welling, Auto-Encoding Variational Bayes, in: International Conference on Learning Representations, 2014."},{"key":"10.1016\/j.asoc.2024.111705_b42","first-page":"1278","article-title":"Stochastic backpropagation and approximate inference in deep generative models","volume":"vol. 32","author":"Rezende","year":"2014"},{"key":"10.1016\/j.asoc.2024.111705_b43","doi-asserted-by":"crossref","first-page":"281","DOI":"10.1007\/s10994-023-06487-7","article-title":"Continual variational dropout: A view of auxiliary local variables in continual learning","volume":"113","author":"Hai","year":"2024","journal-title":"Mach. Learn."},{"issue":"7","key":"10.1016\/j.asoc.2024.111705_b44","doi-asserted-by":"crossref","first-page":"1649","DOI":"10.1162\/089976601750265045","article-title":"Online model selection based on the variational Bayes","volume":"13","author":"Sato","year":"2001","journal-title":"Neural Comput."},{"key":"10.1016\/j.asoc.2024.111705_b45","series-title":"Advances in Neural Information Processing Systems","first-page":"1727","article-title":"Streaming variational Bayes","author":"Broderick","year":"2013"},{"key":"10.1016\/j.asoc.2024.111705_b46","unstructured":"C. Blundell, J. Cornebise, K. Kavukcuoglu, D. Wierstra, Weight Uncertainty in Neural Networks, in: International Conference on Machine Learning, 2015."},{"issue":"8","key":"10.1016\/j.asoc.2024.111705_b47","doi-asserted-by":"crossref","first-page":"10519","DOI":"10.1109\/TPAMI.2023.3241945","article-title":"Variational nested dropout","volume":"45","author":"Cui","year":"2023","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.asoc.2024.111705_b48","series-title":"Advances in Neural Information Processing Systems","first-page":"2074","article-title":"Learning structured sparsity in deep neural networks","author":"Wen","year":"2016"},{"key":"10.1016\/j.asoc.2024.111705_b49","series-title":"Advances in Neural Information Processing Systems","first-page":"2262","article-title":"Learning the number of neurons in deep networks","author":"Alvarez","year":"2016"},{"issue":"11","key":"10.1016\/j.asoc.2024.111705_b50","doi-asserted-by":"crossref","first-page":"2278","DOI":"10.1109\/5.726791","article-title":"Gradient-based learning applied to document recognition","volume":"86","author":"Lecun","year":"1998","journal-title":"Proc. IEEE"}],"container-title":["Applied Soft Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1568494624004794?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1568494624004794?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2024,5,25]],"date-time":"2024-05-25T11:19:41Z","timestamp":1716635981000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1568494624004794"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7]]},"references-count":50,"alternative-id":["S1568494624004794"],"URL":"https:\/\/doi.org\/10.1016\/j.asoc.2024.111705","relation":{},"ISSN":["1568-4946"],"issn-type":[{"value":"1568-4946","type":"print"}],"subject":[],"published":{"date-parts":[[2024,7]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"Sparsify dynamically expandable network via variational dropout","name":"articletitle","label":"Article Title"},{"value":"Applied Soft Computing","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.asoc.2024.111705","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2024 Elsevier B.V. All rights reserved.","name":"copyright","label":"Copyright"}],"article-number":"111705"}}