{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,13]],"date-time":"2026-01-13T21:52:27Z","timestamp":1768341147407,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":43,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,6,3]],"date-time":"2024-06-03T00:00:00Z","timestamp":1717372800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,6,3]]},"DOI":"10.1145\/3659914.3659915","type":"proceedings-article","created":{"date-parts":[[2024,5,15]],"date-time":"2024-05-15T14:13:51Z","timestamp":1715782431000},"page":"1-11","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Towards Sobolev Pruning"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0009-8901-6714","authenticated-orcid":false,"given":"Neil","family":"Kichler","sequence":"first","affiliation":[{"name":"RWTH Aachen University, Aachen, Germany"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2870-8038","authenticated-orcid":false,"given":"Sher","family":"Afghan","sequence":"additional","affiliation":[{"name":"RWTH Aachen University, Aachen, Germany"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7518-5922","authenticated-orcid":false,"given":"Uwe","family":"Naumann","sequence":"additional","affiliation":[{"name":"RWTH Aachen University, Aachen, Germany"}]}],"member":"320","published-online":{"date-parts":[[2024,6,3]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Sobolev spaces","author":"Adams Robert A","unstructured":"Robert A Adams and John Fournier. 2003. Sobolev spaces (2nd ed.). Pure and Applied Mathematics, Vol. 140. Academic Press.","edition":"2"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-50420-5_27"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-69033-9"},{"key":"e_1_3_2_1_4_1","volume-title":"Pattern Recognition and Machine Learning","author":"Bishop Christopher M.","unstructured":"Christopher M. Bishop. 2006. Pattern Recognition and Machine Learning. Springer-Verlag, Berlin, Heidelberg. https:\/\/www.microsoft.com\/en-us\/research\/people\/cmbishop\/prml-book\/"},{"key":"e_1_3_2_1_5_1","volume-title":"Proceedings of the Eighteenth International Conference on Artificial Intelligence and Statistics (IASTATS)","volume":"38","author":"Choromanska Anna","year":"2015","unstructured":"Anna Choromanska, MIkael Henaff, Michael Mathieu, Gerard Ben Arous, and Yann LeCun. 2015. The Loss Surfaces of Multilayer Networks. In Proceedings of the Eighteenth International Conference on Artificial Intelligence and Statistics (IASTATS), Vol. 38. PMLR, 192--204. arXiv:1412.0233"},{"key":"e_1_3_2_1_6_1","unstructured":"Marc Claesen and Bart De Moor. 2015. Hyperparameter Search in Machine Learning. (2015). arXiv:1502.02127"},{"key":"e_1_3_2_1_7_1","unstructured":"Wojciech M Czarnecki Simon Osindero Max Jaderberg Grzegorz Swirszcz and Razvan Pascanu. 2017. Sobolev training for neural networks. Advances in Neural Information Processing Systems 30. arXiv:1706.04859"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/TC.2019.2914438"},{"key":"e_1_3_2_1_9_1","volume-title":"Advances in Neural Information Processing Systems","volume":"27","author":"Dauphin Yann N","year":"2014","unstructured":"Yann N Dauphin, Razvan Pascanu, Caglar Gulcehre, Kyunghyun Cho, Surya Ganguli, and Yoshua Bengio. 2014. Identifying and attacking the saddle point problem in high-dimensional non-convex optimization. In Advances in Neural Information Processing Systems, Vol. 27. arXiv:1406.2572"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.3233\/978-1-61499-621-7-731"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/72.963775"},{"key":"e_1_3_2_1_12_1","volume-title":"Advances in Neural Information Processing Systems","volume":"31","author":"Figurnov Mikhail","year":"2018","unstructured":"Mikhail Figurnov, Shakir Mohamed, and Andriy Mnih. 2018. Implicit Reparameterization Gradients. In Advances in Neural Information Processing Systems, Vol. 31. arXiv:1805.08498"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-0-387-21617-1"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9780898717761"},{"key":"e_1_3_2_1_15_1","volume-title":"Advances in Neural Information Processing Systems","volume":"28","author":"Han Song","year":"2015","unstructured":"Song Han, Jeff Pool, John Tran, and William Dally. 2015. Learning both Weights and Connections for Efficient Neural Network. In Advances in Neural Information Processing Systems, Vol. 28. arXiv:1506.02626"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICNN.1993.298572"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.155"},{"key":"e_1_3_2_1_19_1","volume-title":"Differential Machine Learning. Risk (9","author":"Huge Brian Norsk","year":"2020","unstructured":"Brian Norsk Huge and Antoine Savine. 2020. Differential Machine Learning. Risk (9 2020). arXiv:2005.02347"},{"key":"e_1_3_2_1_20_1","unstructured":"Neil Kichler. 2023. Second-Order Differential ML. Master's thesis. RWTH Aachen."},{"key":"e_1_3_2_1_21_1","volume-title":"Adam: A Method for Stochastic Optimization. In 3rd International Conference on Learning Representations, Yoshua Bengio and Yann LeCun (Eds.). arXiv:1412","author":"Diederik","unstructured":"Diederik P. Kingma and Jimmy Ba. 2015. Adam: A Method for Stochastic Optimization. In 3rd International Conference on Learning Representations, Yoshua Bengio and Yann LeCun (Eds.). arXiv:1412.6980"},{"key":"e_1_3_2_1_22_1","unstructured":"Diederik P Kingma and Max Welling. 2013. Auto-Encoding Variational Bayes. arXiv:1312.6114"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1038\/nature14539"},{"key":"e_1_3_2_1_24_1","unstructured":"Yann LeCun John Denker and Sara Solla. 1989. Optimal Brain Damage. In Advances in Neural Information Processing Systems 2."},{"key":"e_1_3_2_1_25_1","volume-title":"International Conference on Learning Representations (ICLR). arXiv:1810","author":"Lee Namhoon","year":"2019","unstructured":"Namhoon Lee, Thalaiyasingam Ajanthan, and Philip HS Torr. 2019. SNIP: Single-shot network pruning based on connection sensitivity. International Conference on Learning Representations (ICLR). arXiv:1810.02340"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1093\/rfs\/14.1.113"},{"key":"e_1_3_2_1_27_1","volume-title":"Proceedings of the 29th International Conference on Machine Learning. arXiv:1206","author":"Martens James","year":"2012","unstructured":"James Martens, Ilya Sutskever, and Kevin Swersky. 2012. Estimating the Hessian by Back-propagating Curvature. Proceedings of the 29th International Conference on Machine Learning. arXiv:1206.6464"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","unstructured":"Decebal Constantin Mocanu Elena Mocanu Peter Stone Phuong H Nguyen Madeleine Gibescu and Antonio Liotta. 2018. Scalable training of artificial neural networks with adaptive sparse connectivity inspired by network science. Nature communications 9 2383. 10.1038\/s41467-018-04316-3","DOI":"10.1038\/s41467-018-04316-3"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611970906"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9780898717716"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611972078"},{"key":"e_1_3_2_1_32_1","volume-title":"Proceedings of the 32nd International Conference on Machine Learning","volume":"37","author":"Rezende Danilo","year":"2015","unstructured":"Danilo Rezende and Shakir Mohamed. 2015. Variational Inference with Normalizing Flows. In Proceedings of the 32nd International Conference on Machine Learning, Vol. 37. PMLR, 1530--1538. arXiv:1505.05770"},{"key":"e_1_3_2_1_33_1","volume-title":"1st workshop on approximate computing (WAPCO). 0278--0070","author":"Riehme Jan","year":"2015","unstructured":"Jan Riehme and Uwe Naumann. 2015. Significance analysis for numerical models. In 1st workshop on approximate computing (WAPCO). 0278--0070. https:\/\/wapco.e-ce.uth.gr\/2015\/papers\/SESSION3\/WAPCO_3_1.pdf"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1111\/j.1467-9965.2007.00326.x"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1063\/1.3677230"},{"key":"e_1_3_2_1_36_1","volume-title":"Proceedings of the 35th International Conference on Machine Learning","volume":"80","author":"Srinivas Suraj","year":"2018","unstructured":"Suraj Srinivas and Francois Fleuret. 2018. Knowledge Transfer with Jacobian Matching. In Proceedings of the 35th International Conference on Machine Learning, Vol. 80. PMLR, 4723--4731. arXiv:1803.00443"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.2139\/ssrn.3428994"},{"key":"e_1_3_2_1_38_1","volume-title":"Advances in Neural Information Processing Systems","volume":"29","author":"Wen Wei","year":"2016","unstructured":"Wei Wen, Chunpeng Wu, Yandan Wang, Yiran Chen, and Hai Li. 2016. Learning Structured Sparsity in Deep Neural Networks. In Advances in Neural Information Processing Systems, Vol. 29. arXiv:1608.03665"},{"key":"e_1_3_2_1_39_1","volume-title":"Advances in Neural Information Processing Systems","volume":"31","author":"Wilson James","year":"2018","unstructured":"James Wilson, Frank Hutter, and Marc Deisenroth. 2018. Maximizing acquisition functions for Bayesian optimization. In Advances in Neural Information Processing Systems, Vol. 31. arXiv:1805.10196"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1063\/1.4905332"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.643"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/3140659.3080215"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2005.04.010"}],"event":{"name":"PASC '24: Platform for Advanced Scientific Computing Conference","location":"Zurich Switzerland","acronym":"PASC '24","sponsor":["SIGHPC ACM Special Interest Group on High Performance Computing, Special Interest Group on High Performance Computing","ETH Zurich \/ CSCS"]},"container-title":["Proceedings of the Platform for Advanced Scientific Computing Conference"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3659914.3659915","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T00:03:37Z","timestamp":1750291417000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3659914.3659915"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,6,3]]},"references-count":43,"alternative-id":["10.1145\/3659914.3659915","10.1145\/3659914"],"URL":"https:\/\/doi.org\/10.1145\/3659914.3659915","relation":{},"subject":[],"published":{"date-parts":[[2024,6,3]]},"assertion":[{"value":"2024-06-03","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}