{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,25]],"date-time":"2025-03-25T18:17:21Z","timestamp":1742926641214,"version":"3.40.3"},"publisher-location":"Cham","reference-count":24,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783031061554"},{"type":"electronic","value":"9783031061561"}],"license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022]]},"DOI":"10.1007\/978-3-031-06156-1_30","type":"book-chapter","created":{"date-parts":[[2022,6,8]],"date-time":"2022-06-08T20:29:39Z","timestamp":1654720179000},"page":"376-387","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Parallelizing Automatic Model Management System for AIOps on Microservice Platforms"],"prefix":"10.1007","author":[{"given":"Ruibo","family":"Chen","sequence":"first","affiliation":[]},{"given":"Wenjun","family":"Wu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,6,9]]},"reference":[{"issue":"4","key":"30_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3320060","volume":"52","author":"T Ben-Nun","year":"2019","unstructured":"Ben-Nun, T., Hoefler, T.: Demystifying parallel and distributed deep learning: an in-depth concurrency analysis. ACM Comput. Surv. (CSUR) 52(4), 1\u201343 (2019)","journal-title":"ACM Comput. Surv. (CSUR)"},{"issue":"4","key":"30_CR2","doi-asserted-by":"publisher","first-page":"29","DOI":"10.1145\/3183628.3183631","volume":"17","author":"T Cerny","year":"2018","unstructured":"Cerny, T., Donahoo, M.J., Trnka, M.: Contextual understanding of microservice architecture: current and future directions. ACM SIGAPP Appl. Comput. Rev. 17(4), 29\u201345 (2018)","journal-title":"ACM SIGAPP Appl. Comput. Rev."},{"key":"30_CR3","unstructured":"Chen, C.C., Yang, C.L., Cheng, H.Y.: Efficient and robust parallel DNN training through model parallelism on multi-GPU platform. arXiv preprint arXiv:1809.02839 (2018)"},{"key":"30_CR4","doi-asserted-by":"crossref","unstructured":"Dang, Y., Lin, Q., Huang, P.: AIOps: real-world challenges and research innovations. In: 2019 IEEE\/ACM 41st International Conference on Software Engineering: Companion Proceedings (ICSE-Companion), pp. 4\u20135. IEEE (2019)","DOI":"10.1109\/ICSE-Companion.2019.00023"},{"key":"30_CR5","unstructured":"Diethe, T., Borchert, T., Thereska, E., Balle, B., Lawrence, N.: Continual learning in practice. arXiv preprint arXiv:1903.05202 (2019)"},{"issue":"3","key":"30_CR6","doi-asserted-by":"publisher","first-page":"94","DOI":"10.1109\/MS.2016.68","volume":"33","author":"C Ebert","year":"2016","unstructured":"Ebert, C., Gallardo, G., Hernantes, J., Serrano, N.: DevOps. IEEE Softw. 33(3), 94\u2013100 (2016)","journal-title":"IEEE Softw."},{"key":"30_CR7","doi-asserted-by":"crossref","unstructured":"Fontenla-Romero, \u00d3., Guijarro-Berdi\u00f1as, B., Martinez-Rego, D., P\u00e9rez-S\u00e1nchez, B., Peteiro-Barral, D.: Online machine learning. In: Efficiency and Scalability Methods for Computational Intellect, pp. 27\u201354. IGI Global (2013)","DOI":"10.4018\/978-1-4666-3942-3.ch002"},{"key":"30_CR8","doi-asserted-by":"crossref","unstructured":"Haselb\u00f6ck, S., Weinreich, R.: Decision guidance models for microservice monitoring. In: 2017 IEEE International Conference on Software Architecture Workshops (ICSAW), pp. 54\u201361. IEEE (2017)","DOI":"10.1109\/ICSAW.2017.31"},{"key":"30_CR9","doi-asserted-by":"crossref","unstructured":"Hecht-Nielsen, R.: Theory of the backpropagation neural network. In: Neural Networks for Perception, pp. 65\u201393. Elsevier (1992)","DOI":"10.1016\/B978-0-12-741252-8.50010-8"},{"key":"30_CR10","volume-title":"Continuous Delivery: Reliable Software Releases Through Build, Test, and Deployment Automation","author":"J Humble","year":"2010","unstructured":"Humble, J., Farley, D.: Continuous Delivery: Reliable Software Releases Through Build, Test, and Deployment Automation. Pearson Education, London (2010)"},{"issue":"7553","key":"30_CR11","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun, Y., Bengio, Y., Hinton, G.: Deep learning. Nature 521(7553), 436\u2013444 (2015)","journal-title":"Nature"},{"issue":"2","key":"30_CR12","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3385187","volume":"29","author":"Y Li","year":"2020","unstructured":"Li, Y., et al.: Predicting node failures in an ultra-large-scale cloud computing platform: an AIOps solution. ACM Trans. Softw. Eng. Methodol. (TOSEM) 29(2), 1\u201324 (2020)","journal-title":"ACM Trans. Softw. Eng. Methodol. (TOSEM)"},{"key":"30_CR13","unstructured":"Littman, M.S., Metcalf, C.D.: An exploration of asynchronous data-parallelism. Personal communication (1990)"},{"key":"30_CR14","doi-asserted-by":"publisher","unstructured":"Masood, A., Hashmi, A.: AIOps: predictive analytics & machine learning in operations. In: Cognitive Computing Recipes, pp. 359\u2013382. Springer, Berkeley (2019). https:\/\/doi.org\/10.1007\/978-1-4842-4106-6_7","DOI":"10.1007\/978-1-4842-4106-6_7"},{"key":"30_CR15","unstructured":"Park, J.H., et al.: HetPipe: enabling large $$\\{$$DNN$$\\}$$ training on (Whimpy) heterogeneous $$\\{$$GPU$$\\}$$ clusters through integration of pipelined model parallelism and data parallelism. In: 2020 $$\\{$$USENIX$$\\}$$ Annual Technical Conference ($$\\{$$USENIX$$\\}$$$$\\{$$ATC$$\\}$$ 2020), pp. 307\u2013321 (2020)"},{"issue":"4","key":"30_CR16","first-page":"51","volume":"10","author":"R Schneider","year":"2008","unstructured":"Schneider, R.: Continuous integration: improving software quality and reducing risk. Softw. Qual. Prof. 10(4), 51 (2008)","journal-title":"Softw. Qual. Prof."},{"key":"30_CR17","unstructured":"Shallue, C.J., Lee, J., Antognini, J., Sohl-Dickstein, J., Frostig, R., Dahl, G.E.: Measuring the effects of data parallelism on neural network training. arXiv preprint arXiv:1811.03600 (2018)"},{"key":"30_CR18","doi-asserted-by":"crossref","unstructured":"Singh, V., Peddoju, S.K.: Container-based microservice architecture for cloud applications. In: 2017 International Conference on Computing, Communication and Automation (ICCCA), pp. 847\u2013852. IEEE (2017)","DOI":"10.1109\/CCAA.2017.8229914"},{"key":"30_CR19","doi-asserted-by":"crossref","unstructured":"Stocco, A., Tonella, P.: Towards anomaly detectors that learn continuously. In: 2020 IEEE International Symposium on Software Reliability Engineering Workshops (ISSREW), pp. 201\u2013208. IEEE (2020)","DOI":"10.1109\/ISSREW51248.2020.00073"},{"key":"30_CR20","doi-asserted-by":"crossref","unstructured":"Subhlok, J., Stichnoth, J.M., O\u2019hallaron, D.R., Gross, T.: Exploiting task and data parallelism on a multicomputer. In: Proceedings of the Fourth ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming, pp. 13\u201322 (1993)","DOI":"10.1145\/173284.155334"},{"key":"30_CR21","doi-asserted-by":"crossref","unstructured":"Tamburri, D.A.: Sustainable MLOps: trends and challenges. In: 2020 22nd International Symposium on Symbolic and Numeric Algorithms for Scientific Computing (SYNASC), pp. 17\u201323. IEEE (2020)","DOI":"10.1109\/SYNASC51798.2020.00015"},{"key":"30_CR22","doi-asserted-by":"crossref","unstructured":"Wang, L., Zhao, N., Chen, J., Li, P., Zhang, W., Sui, K.: Root-cause metric location for microservice systems via log anomaly detection. In: 2020 IEEE International Conference on Web Services (ICWS), pp. 142\u2013150. IEEE (2020)","DOI":"10.1109\/ICWS49710.2020.00026"},{"key":"30_CR23","doi-asserted-by":"crossref","unstructured":"Zhou, Y., Yu, Y., Ding, B.: Towards MLOps: a case study of ML pipeline platform. In: 2020 International Conference on Artificial Intelligence and Computer Engineering (ICAICE), pp. 494\u2013500. IEEE (2020)","DOI":"10.1109\/ICAICE51518.2020.00102"},{"issue":"3","key":"30_CR24","doi-asserted-by":"publisher","first-page":"32","DOI":"10.1109\/MS.2016.81","volume":"33","author":"L Zhu","year":"2016","unstructured":"Zhu, L., Bass, L., Champlin-Scharff, G.: DevOps and its practices. IEEE Softw. 33(3), 32\u201334 (2016)","journal-title":"IEEE Softw."}],"container-title":["Lecture Notes in Computer Science","Euro-Par 2021: Parallel Processing Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-06156-1_30","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,8]],"date-time":"2022-06-08T20:32:51Z","timestamp":1654720371000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-06156-1_30"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"ISBN":["9783031061554","9783031061561"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-06156-1_30","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2022]]},"assertion":[{"value":"9 June 2022","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"Euro-Par","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Parallel Processing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Lisbon","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Portugal","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"30 August 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"31 August 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"europar2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/2021.euro-par.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"EasyChair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"136","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"39","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"29% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"4","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"6","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"The conference was held virtually due to the COVID-19 pandemic.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}