{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,18]],"date-time":"2025-12-18T14:19:54Z","timestamp":1766067594553,"version":"3.37.3"},"reference-count":47,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2022,8,26]],"date-time":"2022-08-26T00:00:00Z","timestamp":1661472000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,8,26]],"date-time":"2022-08-26T00:00:00Z","timestamp":1661472000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"The Key Research and Development Program of Zhejiang Province","award":["2019C01059","2019C03134","2019C03135"],"award-info":[{"award-number":["2019C01059","2019C03134","2019C03135"]}]},{"DOI":"10.13039\/501100001809","name":"The National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["61972358"],"award-info":[{"award-number":["61972358"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001809","name":"the National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["62072146"],"award-info":[{"award-number":["62072146"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]},{"name":"The Science Foundation of Beijing","award":["L182053"],"award-info":[{"award-number":["L182053"]}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["CCF Trans. HPC"],"published-print":{"date-parts":[[2023,12]]},"DOI":"10.1007\/s42514-022-00098-9","type":"journal-article","created":{"date-parts":[[2022,8,26]],"date-time":"2022-08-26T03:27:52Z","timestamp":1661484472000},"page":"429-441","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["MP-DPS: adaptive distributed training for deep learning based on node merging and path prediction"],"prefix":"10.1007","volume":"5","author":[{"given":"Yan","family":"Zeng","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2026-417X","authenticated-orcid":false,"given":"Yong","family":"Ding","sequence":"additional","affiliation":[]},{"given":"Dongyang","family":"Ou","sequence":"additional","affiliation":[]},{"given":"Jilin","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Yongjian","family":"Ren","sequence":"additional","affiliation":[]},{"given":"Yunquan","family":"Zhang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,8,26]]},"reference":[{"key":"98_CR1","unstructured":"Addanki, R.: Learning generalizable device placement algorithms for distributed machine learning. Massachusetts Institute of Technology (2019)"},{"key":"98_CR2","unstructured":"Addanki, R., Bojja Venkatakrishnan, S., Gupta, S., Mao, H., Alizadeh, M.: Placeto: Learning generalizable device placement algorithms for distributed machine learning. arXiv preprint arXiv:1906.08879 (2019)"},{"key":"98_CR3","doi-asserted-by":"crossref","unstructured":"Alixandre, B., Dorn, M.: D-BRKGA: a distributed biased random-key genetic algorithm. In: 2017 IEEE congress on evolutionary computation (CEC). IEEE, (2017)","DOI":"10.1109\/CEC.2017.7969467"},{"issue":"3","key":"98_CR4","doi-asserted-by":"publisher","first-page":"682","DOI":"10.1109\/TPDS.2013.57","volume":"25","author":"H Arabnejad","year":"2014","unstructured":"Arabnejad, H., Barbosa, J.G.: List scheduling algorithm for heterogeneous systems by an optimistic cost table. IEEE Trans. Parallel Distrib. Syst. 25(3), 682\u2013694 (2014)","journal-title":"IEEE Trans. Parallel Distrib. Syst."},{"issue":"1","key":"98_CR5","doi-asserted-by":"publisher","first-page":"12035","DOI":"10.1088\/1742-6596\/1646\/1\/012035","volume":"1646","author":"Y Bai","year":"2020","unstructured":"Bai, Y., Wang, J., Wang, X., et al.: The summary of deep learning in the field of weather forecast research. J. Phys. Conf. Ser. 1646(1), 12035 (2020)","journal-title":"J. Phys. Conf. Ser."},{"key":"98_CR6","doi-asserted-by":"crossref","unstructured":"Ballard, G., Buluc, A., Demmel, J., et al.: Communication optimal parallel multiplication of sparse random matrices. In: Proceedings of the twenty-fifth annual ACM symposium on Parallelism in algorithms and architectures, pp 222\u2013231 (2013)","DOI":"10.1145\/2486159.2486196"},{"key":"98_CR7","doi-asserted-by":"publisher","first-page":"101","DOI":"10.1002\/cpe.4330060203","volume":"6","author":"ST Barnard","year":"1994","unstructured":"Barnard, S.T., Simon, H.D.: Fast multilevel implementation of recursive spectral bisection for partitioning unstructured problems. Concurr Pract Exp 6, 101\u2013117 (1994)","journal-title":"Concurr Pract Exp"},{"issue":"1","key":"98_CR8","doi-asserted-by":"publisher","first-page":"376","DOI":"10.1029\/2018MS001472","volume":"11","author":"T Bolton","year":"2019","unstructured":"Bolton, T., Zanna, L.: Applications of deep learning to ocean data inference and subgrid parameterization. J Adv Model Earth Syst 11(1), 376\u2013399 (2019)","journal-title":"J Adv Model Earth Syst"},{"key":"98_CR9","unstructured":"Brown, T.B., Mann, B., Nick, R., Subbiah, M., Kaplan, J., Dhariwal, P., Neelakantan, A., Shyam, P., Sastry, G., Askell, A., et al.: Language models are few-shot learners. arXiv preprint arXiv:2005.14165, 2020. pp xiv, 1, 3, 3, 3, 18, 19"},{"key":"98_CR10","unstructured":"Brown, T.B., Mann, B., Ryder, N., Subbiah, M., Kaplan, J., Dhariwal, P., Neelakantan, A., Shyam, P., Sastry, G., Askell, A., et al.: Language models are few-shot learners. arXiv preprint arXiv:2005.14165 (2020)."},{"key":"98_CR11","unstructured":"Cai, Z., Ma, K., Yan, X., Wu, Y., Huang, Y., Cheng, J., Su, T., Yu, F.: TensorOpt: exploring the tradeoffs in distributed DNN training with auto-parallelism. arXiv preprint arXiv:2004.10856 (2020)"},{"key":"98_CR12","doi-asserted-by":"crossref","unstructured":"Carion, N., Massa, F., Synnaeve, G., et al.: End-to-end object detection with transformers. In: European Conference on Computer Vision. Springer, Cham, pp 213\u2013229 (2020)","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"98_CR13","unstructured":"Dean, J.: A hierarchical model for device placement. In International conference on learning representations (2018)"},{"key":"98_CR14","unstructured":"Devlin, J., Chang, M.-W., Lee, K., Toutanova, K.: Bert: Pretraining of deep bidirectional transformers for language understanding. arXiv preprint arXiv:1810.04805, pp 1, 1, 3, 3, 40, 141, 142, 154, 154, 154, 154,163, 173 (2018)"},{"key":"98_CR15","unstructured":"Frazier, P.I.: A tutorial on Bayesian optimization. arXiv preprint arXiv:1807.02811 (2018)."},{"key":"98_CR16","unstructured":"Gao, Y., Chen,L., Li, B.: Post: Device placement with cross-entropy minimization and proximal policy optimization. In: Advances in neural information processing systems. 9971\u20139980 (2018)"},{"key":"98_CR17","unstructured":"Jia, Z., Lin, S., Qi, C.R., et al.: Exploring hidden dimensions in parallelizing convolutional neural networks. arXiv preprint arXiv:1802.04924, (2018)"},{"key":"98_CR18","unstructured":"Jia, Z., Zaharia, M., Aiken, A.. Beyond data and model parallelism for deep neural networks. arXiv preprint arXiv:1807.05358 (2018)."},{"key":"98_CR19","first-page":"1095","volume":"2012","author":"S Kim","year":"2012","unstructured":"Kim, S., Xing, E.P.: Tree-guided group lasso for multi-response regression with structured sparsity, with an application to eQTL mapping. Ann. Appl. Stat. 2012, 1095\u20131117 (2012)","journal-title":"Ann. Appl. Stat."},{"key":"98_CR20","first-page":"125","volume-title":"Semantic object parsing with graph LSTM[C]\/\/European conference on computer vision","author":"X Liang","year":"2016","unstructured":"Liang, X., Shen, X., Feng, J., et al.: Semantic object parsing with graph LSTM[C]\/\/European conference on computer vision, pp. 125\u2013143. Springer, Cham (2016)"},{"key":"98_CR21","unstructured":"Mirhoseini, A., Pham, H., Le, Q.V., Steiner, B., Larsen, R., Zhou, Y., Kumar, N., Norouzi, M., Bengio, S., Dean, J.: Device placement optimization with reinforcement learning. In: International conference on machine learning. PMLR, 2430\u20132439 (2017a)"},{"key":"98_CR22","unstructured":"Mirhoseini, A., Pham, H., Le, Q.V., Steiner, B., Larsen, R., Zhou, Y., Kumar, N., Norouzi, M., Bengio, S., Dean, J.: Device placement optimization with reinforcement learning. In: International Conference on Machine Learning. PMLR, 2430\u20132439 (2017b)"},{"key":"98_CR23","unstructured":"Mirhoseini, A., Pham, H., Le, Q.V., et al.: Device placement optimization with reinforcement learning. In: International Conference on Machine Learning. PMLR, pp 2430\u20132439 (2017)"},{"key":"98_CR24","unstructured":"Mirhoseini, A., Goldie, A., Pham, H., Steiner, B., Le, Q.V, Dean J.: A hierarchical model for device placement. In International conference on learning representations (2018)"},{"key":"98_CR25","unstructured":"Neubig, G., Dyer, C., Goldberg, Y., et al.: Dynet: The dynamic neural network toolkit. arXiv preprint arXiv:1701.03980, (2017)"},{"key":"98_CR26","unstructured":"Pellegrini, F.: Distillating knowledge about Scotch. In Dagstuhl Seminar Proceedings. Schloss Dagstuhl-Leibniz-Zentrum f\u00fcr Informatik (2009a)"},{"key":"98_CR27","unstructured":"Pellegrini, F.: Distillating knowledge about Scotch. In: Dagstuhl Seminar Proceedings. Schloss Dagstuhl-Leibniz-Zentrum f\u00fcr Informatik (2009b)"},{"key":"98_CR28","unstructured":"Pellegrini, F., Roman, J.: Experimental analysis of the dual recursive bipartitioning algorithm for static mapping. In TR 1038\u201396, LaBRI, URA CNRS 1304, Univ. Bordeaux I. Citeseer (1996)"},{"key":"98_CR29","doi-asserted-by":"crossref","unstructured":"Peng, Y., Bao, Y., Chen, Y., Wu, C., Guo, C.: Optimus: an efficient dynamic resource scheduler for deep learning clusters. In: Proceedings of the Thirteenth EuroSys Conference. 1\u201314 (2018)","DOI":"10.1145\/3190508.3190517"},{"key":"98_CR30","doi-asserted-by":"crossref","unstructured":"Peters, M.E., Ammar, W., Bhagavatula, C., Power R.: Semi-supervised sequence tagging with bidirectional language models. arXiv preprint arXiv:1705.00108 (2017)","DOI":"10.18653\/v1\/P17-1161"},{"key":"98_CR31","unstructured":"Paliwal, A., Gimeno, F., Nair, V., Li,Y., Lubin, M., Kohli, P., Vinyals, O.: Reinforced genetic algorithm learning for optimizing computation graphs. arXiv preprint arXiv:1905.02494 (2019a)."},{"key":"98_CR32","unstructured":"Paliwal, A., Gimeno, F., Nair, V., Li, Y., Lubin, M., Kohli, P., Vinyals, O.: Reinforced genetic algorithm learning for optimizing computation graphs. arXiv preprint arXiv:1905.02494 (2019b)"},{"key":"98_CR33","unstructured":"Raffel, C., Shazeer, N., Roberts, A., Lee, K., Narang, S., Matena, M., Zhou, Y., Li, W., Liu, P.J.: Exploring the limits of transfer learning with a unified text-to-text transformer. arXiv preprint arXiv:1910.10683, p 1 (2019)"},{"key":"98_CR34","unstructured":"Shazeer, N., Mirhoseini, A., Maziarz, K., Davis, A., Le, Q., Hinton, G., Dean, J.: Outrageously large neural networks: The sparsely-gated mixtureof-experts layer. arXiv preprint arXiv:1701.06538, pp 1, 32, 32, 88 (2017)"},{"issue":"7587","key":"98_CR35","doi-asserted-by":"publisher","first-page":"484","DOI":"10.1038\/nature16961","volume":"529","author":"D Silver","year":"2016","unstructured":"Silver, D., Huang, A., Maddison, C.J., Guez, A., Sifre, L., VanDen, D.G., Schrittwieser, J., Antonoglou, I., Panneershelvam, V., Lanctot, M., et al.: Mastering the game of go with deep neural networks and tree search. Nature 529(7587), 484\u2013489 (2016)","journal-title":"Nature"},{"key":"98_CR36","unstructured":"Sun, S., Chen, W., Bian, J., Liu, X., Liu, T.-Y.:. Slim-DP: a multi-agent system for communication-efficient distributed deep learning. In Proceedings of the 17th International Conference on Autonomous Agents and MultiAgent Systems. pp 721\u2013729 (2018)"},{"key":"98_CR37","unstructured":"Sutskever, I., Vinyals, O., Le, Q.V.: Sequence to sequence learning with neural networks. arXiv preprint arXiv:1409.3215 (2014)"},{"key":"98_CR38","unstructured":"Tensorflow slim (2016) https:\/\/github.com\/tensorflow\/tensorflow\/tree\/master\/tensorflow\/contrib\/slim."},{"issue":"3","key":"98_CR39","doi-asserted-by":"publisher","first-page":"293","DOI":"10.1001\/jamainternmed.2018.7117","volume":"179","author":"F Wang","year":"2019","unstructured":"Wang, F., Casalino, L.P., Khullar, D.: Deep learning in medicine\u2014promise, progress, and challenges. JAMA Intern. Med. 179(3), 293\u2013294 (2019a)","journal-title":"JAMA Intern. Med."},{"key":"98_CR40","doi-asserted-by":"crossref","unstructured":"Wang, M., Huang, C., Li, J.: Supporting very large models using automatic dataflow graph partitioning[C]. In: Proceedings of the Fourteenth EuroSys Conference 2019b, 1\u201317. (2019b)","DOI":"10.1145\/3302424.3303953"},{"key":"98_CR41","unstructured":"Wang, L., Guo, Z.H., Cao, F., et al.: Automatic generation method of model splitting strategy for model parallel training. Comput Eng Sci (2020)"},{"key":"98_CR42","unstructured":"Wu, Y., Schuster, M., Chen, Z., Le, Q.L., Norouzi, M., Macherey, W., Krikun, M., Cao, Y., Gao, Q., Macherey, K., et al.: Google\u2019s neural machine translation system: Bridging the gap between human and machine translation. arXiv preprint arXiv:1609.08144 (2016)"},{"key":"98_CR43","doi-asserted-by":"crossref","unstructured":"Yi, X., Luo, Z., Meng, C., et al.: Fast training of deep learning models over multiple GPUs[C]. In: Proceedings of the 21st International middleware conference., pp 105\u2013118. (2020)","DOI":"10.1145\/3423211.3425675"},{"key":"98_CR44","doi-asserted-by":"crossref","unstructured":"Yu, C., Gao, C., Wang, J., et al.: Bisenet v2: Bilateral network with guided aggregation for real-time semantic segmentation. arXiv preprint arXiv:2004.02147, (2020)","DOI":"10.1007\/s11263-021-01515-2"},{"key":"98_CR45","doi-asserted-by":"crossref","unstructured":"Zhang, S., Tay, Y., Yao, L., et al.: Deeprec: An open-source toolkit for deep learning based recommendation. arXiv preprint arXiv:1905.10536, (2019)","DOI":"10.24963\/ijcai.2019\/963"},{"key":"98_CR46","first-page":"906","volume":"33","author":"H Zhang","year":"2020","unstructured":"Zhang, H., Li, Y., Deng, Z., et al.: AutoSync: learning to synchronize for data-parallel distributed deep learning. Adv Neural Inf Process Syst 33, 906\u2013917 (2020)","journal-title":"Adv Neural Inf Process Syst"},{"key":"98_CR47","unstructured":"Zhou, Q.: Research on task scheduling method of heterogeneous multi-processor in distributed environment. South China Univ. Technol. (2017)"}],"container-title":["CCF Transactions on High Performance Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42514-022-00098-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s42514-022-00098-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42514-022-00098-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,12,15]],"date-time":"2023-12-15T12:04:18Z","timestamp":1702641858000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s42514-022-00098-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,8,26]]},"references-count":47,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2023,12]]}},"alternative-id":["98"],"URL":"https:\/\/doi.org\/10.1007\/s42514-022-00098-9","relation":{},"ISSN":["2524-4922","2524-4930"],"issn-type":[{"type":"print","value":"2524-4922"},{"type":"electronic","value":"2524-4930"}],"subject":[],"published":{"date-parts":[[2022,8,26]]},"assertion":[{"value":"14 December 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 March 2022","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"26 August 2022","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}