{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T00:40:06Z","timestamp":1755909606909,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":28,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,4,22]],"date-time":"2024-04-22T00:00:00Z","timestamp":1713744000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"UKRI and EPSRC","award":["EP\/S022694\/1"],"award-info":[{"award-number":["EP\/S022694\/1"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,4,22]]},"DOI":"10.1145\/3642970.3655847","type":"proceedings-article","created":{"date-parts":[[2024,4,19]],"date-time":"2024-04-19T10:46:57Z","timestamp":1713523617000},"page":"176-183","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Comparative Profiling"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-7994-6498","authenticated-orcid":false,"given":"Bradley","family":"Aldous","sequence":"first","affiliation":[{"name":"Queen Mary University of London, London, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1374-1882","authenticated-orcid":false,"given":"Ahmed M.","family":"Abdelmoniem","sequence":"additional","affiliation":[{"name":"Queen Mary University of London, London, United Kingdom"}]}],"member":"320","published-online":{"date-parts":[[2024,4,22]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1186\/s40537-023-00765-w"},{"key":"e_1_3_2_1_2_1","unstructured":"Mart\u00edn Abadi Ashish Agarwal Paul Barham Eugene Brevdo Zhifeng Chen Craig Citro Greg S. Corrado Andy Davis Jeffrey Dean Matthieu Devin Sanjay Ghemawat Ian Goodfellow Andrew Harp Geoffrey Irving Michael Isard Yangqing Jia Rafal Jozefowicz Lukasz Kaiser Manjunath Kudlur Josh Levenberg Dandelion Man\u00e9 Rajat Monga Sherry Moore Derek Murray Chris Olah Mike Schuster Jonathon Shlens Benoit Steiner Ilya Sutskever Kunal Talwar Paul Tucker Vincent Vanhoucke Vijay Vasudevan Fernanda Vi\u00e9gas Oriol Vinyals Pete Warden Martin Wattenberg Martin Wicke Yuan Yu and Xiaoqiang Zheng. 2015. TensorFlow: Large-Scale Machine Learning on Heterogeneous Systems. https:\/\/www.tensorflow.org\/ Software available from tensorflow.org."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/INFOCOM42981.2021.9488810"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1186\/s41235-023-00499-6"},{"key":"e_1_3_2_1_5_1","unstructured":"Lukas Biewald. 2020. Experiment Tracking with Weights and Biases. https:\/\/www.wandb.com\/ Software available from wandb.com."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/CEIT.2018.8751930"},{"key":"e_1_3_2_1_7_1","volume-title":"MXNet: A Flexible and Efficient Machine Learning Library for Heterogeneous Distributed Systems. (12","author":"Chen Tianqi","year":"2015","unstructured":"Tianqi Chen, Mu Li, Yutian Li, Min Lin, Naiyan Wang, Minjie Wang, Tianjun Xiao, Bing Xu, Chiyuan Zhang, and Zheng Zhang. 2015. MXNet: A Flexible and Efficient Machine Learning Library for Heterogeneous Distributed Systems. (12 2015). http:\/\/arxiv.org\/abs\/1512.01274"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","unstructured":"William Falcon and The PyTorch Lightning team. 2019. PyTorch Lightning. https:\/\/doi.org\/10.5281\/zenodo.3828935","DOI":"10.5281\/zenodo.3828935"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCC202255925.2022.9922765"},{"key":"e_1_3_2_1_10_1","volume-title":"Michael McThrow, Tao Komikado, Koji Maruhashi, Kanji Uchino, Xiaoning Qian, and Shuiwang Ji.","author":"Fu Cong","year":"2023","unstructured":"Cong Fu, Keqiang Yan, Limei Wang, Wing Yee Au, Michael McThrow, Tao Komikado, Koji Maruhashi, Kanji Uchino, Xiaoning Qian, and Shuiwang Ji. 2023. A Latent Diffusion Model for Protein Structure Generation. arXiv:2305.04120 [q-bio.BM]"},{"key":"e_1_3_2_1_11_1","volume-title":"Comparative Analysis of CPU and GPU Profiling for Deep Learning Models. (9","author":"Gyawali Dipesh","year":"2023","unstructured":"Dipesh Gyawali. 2023. Comparative Analysis of CPU and GPU Profiling for Deep Learning Models. (9 2023). http:\/\/arxiv.org\/abs\/2309.02521"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2654889"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19-1011"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.14778\/3415478.3415530"},{"key":"e_1_3_2_1_15_1","volume-title":"Plumbley","author":"Liu Haohe","year":"2023","unstructured":"Haohe Liu, Zehua Chen, Yi Yuan, Xinhao Mei, Xubo Liu, Danilo Mandic, Wenwu Wang, and Mark D. Plumbley. 2023. AudioLDM: Text-to-Audio Generation with Latent Diffusion Models. (1 2023). https:\/\/arxiv.org\/abs\/2301.12503"},{"key":"e_1_3_2_1_16_1","volume-title":"Plumbley","author":"Liu Haohe","year":"2023","unstructured":"Haohe Liu, Qiao Tian, Yi Yuan, Xubo Liu, Xinhao Mei, Qiuqiang Kong, Yuping Wang, Wenwu Wang, Yuxuan Wang, and Mark D. Plumbley. 2023. AudioLDM 2: Learning Holistic Audio Generation with Self-supervised Pretraining. (8 2023). http:\/\/arxiv.org\/abs\/2308.05734"},{"key":"e_1_3_2_1_17_1","volume-title":"Proceedings of Machine Learning and Systems, A. Smola, A. Dimakis, and I. Stoica (Eds.)","volume":"3","author":"Abdelmoniem Ahmed M.","year":"2021","unstructured":"Ahmed M. Abdelmoniem, Ahmed Elzanaty, Mohamed-Slim Alouini, and Marco Canini. 2021. An Efficient Statistical-based Gradient Compression Technique for Distributed Training Systems. In Proceedings of Machine Learning and Systems, A. Smola, A. Dimakis, and I. Stoica (Eds.), Vol. 3. 297--322. https:\/\/proceedings.mlsys.org\/paper_files\/paper\/2021\/file\/fea47a8aa372e42f3c84327aec9506cf-Paper.pdf"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.2120481119"},{"key":"e_1_3_2_1_19_1","unstructured":"PyTorch. 2021. Introducing PyTorch Profiler - the new and improved performance tool. https:\/\/pytorch.org\/docs\/stable\/profiler.html Software available from https:\/\/pytorch.org."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3406703"},{"key":"e_1_3_2_1_21_1","volume-title":"High-Resolution Image Synthesis with Latent Diffusion Models. (12","author":"Rombach Robin","year":"2021","unstructured":"Robin Rombach, Andreas Blattmann, Dominik Lorenz, Patrick Esser, and Bj\u00f6rn Ommer. 2021. High-Resolution Image Synthesis with Latent Diffusion Models. (12 2021). http:\/\/arxiv.org\/abs\/2112.10752"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/HIPC.2009.5433185"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2945397"},{"key":"e_1_3_2_1_24_1","volume-title":"Horovod: fast and easy distributed deep learning in TensorFlow. (2","author":"Sergeev Alexander","year":"2018","unstructured":"Alexander Sergeev and Mike Del Balso. 2018. Horovod: fast and easy distributed deep learning in TensorFlow. (2 2018). https:\/\/arxiv.org\/abs\/1802.05799"},{"key":"e_1_3_2_1_25_1","volume-title":"Performance Modeling and Evaluation of Distributed Deep Learning Frameworks on GPUs. (11","author":"Shi Shaohuai","year":"2017","unstructured":"Shaohuai Shi, Qiang Wang, and Xiaowen Chu. 2017. Performance Modeling and Evaluation of Distributed Deep Learning Frameworks on GPUs. (11 2017). http:\/\/arxiv.org\/abs\/1711.05979"},{"key":"e_1_3_2_1_26_1","volume-title":"Proceedings of the 32nd International Conference on Machine Learning, 2256--2265","author":"Sohl-Dickstein Jascha","year":"2015","unstructured":"Jascha Sohl-Dickstein, Eric Weiss, Niru Maheswaranathan, and Surya Ganguli. 2015. Deep Unsupervised Learning using Nonequilibrium Thermodynamics. Proceedings of the 32nd International Conference on Machine Learning, 2256--2265."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/2872887.2750375"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/3578356.3592589"}],"event":{"name":"EuroSys '24: Nineteenth European Conference on Computer Systems","sponsor":["SIGOPS ACM Special Interest Group on Operating Systems"],"location":"Athens Greece","acronym":"EuroSys '24"},"container-title":["Proceedings of the 4th Workshop on Machine Learning and Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3642970.3655847","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3642970.3655847","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T00:15:54Z","timestamp":1755908154000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3642970.3655847"}},"subtitle":["Insights Into Latent Diffusion Model Training"],"short-title":[],"issued":{"date-parts":[[2024,4,22]]},"references-count":28,"alternative-id":["10.1145\/3642970.3655847","10.1145\/3642970"],"URL":"https:\/\/doi.org\/10.1145\/3642970.3655847","relation":{},"subject":[],"published":{"date-parts":[[2024,4,22]]},"assertion":[{"value":"2024-04-22","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}