{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,21]],"date-time":"2026-02-21T08:29:55Z","timestamp":1771662595665,"version":"3.50.1"},"reference-count":25,"publisher":"Zhejiang University Press","issue":"1","license":[{"start":{"date-parts":[[2024,12,27]],"date-time":"2024-12-27T00:00:00Z","timestamp":1735257600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,12,27]],"date-time":"2024-12-27T00:00:00Z","timestamp":1735257600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Front Inform Technol Electron Eng"],"published-print":{"date-parts":[[2025,1]]},"DOI":"10.1631\/fitee.2300684","type":"journal-article","created":{"date-parts":[[2024,12,26]],"date-time":"2024-12-26T17:03:34Z","timestamp":1735232614000},"page":"109-118","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Automatic parallelism strategy generation with minimal memory redundancy","\u6700\u5c0f\u5316\u5185\u5b58\u5197\u4f59\u7684\u81ea\u52a8\u5e76\u884c\u7b56\u7565\u751f\u6210\u65b9\u6cd5"],"prefix":"10.1631","volume":"26","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8899-1018","authenticated-orcid":false,"given":"Yanqi","family":"Shi","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5590-5179","authenticated-orcid":false,"given":"Peng","family":"Liang","sequence":"additional","affiliation":[]},{"given":"Hao","family":"Zheng","sequence":"additional","affiliation":[]},{"given":"Linbo","family":"Qiao","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9743-2034","authenticated-orcid":false,"given":"Dongsheng","family":"Li","sequence":"additional","affiliation":[]}],"member":"635","published-online":{"date-parts":[[2024,12,27]]},"reference":[{"key":"ref1","article-title":"Language models are few-shot learners","volume-title":"Proc 34th Int Conf on Neural Information Processing Systems","author":"Brown","year":"2020"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/tpds.2021.3132413"},{"key":"ref3","author":"Chowdhery","year":"2022","journal-title":"PaLM: scaling language modeling with pathways"},{"key":"ref4","author":"Dan","year":"2023","journal-title":"EduChat: a large-scale language model-based chatbot system for intelligent education"},{"key":"ref5","first-page":"4171","article-title":"BERT: pre-training of deep bidirectional Transformers for language under-standing","volume-title":"Proc Conf of the 9th American Chapter of the Association for Computational Linguistics: Human Language Technologies","author":"Devlin","year":"2019"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1631\/fitee.1800566"},{"key":"ref7","author":"Harlap","year":"2018","journal-title":"PipeDream: fast and efficient pipeline parallel DNN training"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1631\/fitee.2200412"},{"key":"ref9","article-title":"GPipe: efficient training of giant neural networks using pipeline parallelism","volume-title":"Proc 33rd Int Conf on Neural Information Processing Systems","author":"Huang","year":"2019"},{"key":"ref10","first-page":"2274","article-title":"Exploring hidden dimensions in accelerating convolutional neural networks","volume-title":"Proc 35th Int Conf on Machine Learning","author":"Jia","year":"2018"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/3065386"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1631\/fitee.1601771"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3605573.3605613"},{"key":"ref14","author":"Liu","year":"2023","journal-title":"Colossal-Auto: unified automation of parallelization and activation checkpoint for large-scale models"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3581784.3607073"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1631\/fitee.1800421"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3458817.3476209"},{"key":"ref18","author":"Naumov","year":"2019","journal-title":"Deep learning recommendation model for personalization and recommendation systems"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/SC41405.2020.00024"},{"key":"ref20","first-page":"10435","article-title":"Mesh-TensorFlow: deep learning for supercomputers","volume-title":"Proc 32nd Int Conf on Neural Information Processing Systems","author":"Shazeer","year":"2018"},{"key":"ref21","author":"Shoeybi","year":"2019","journal-title":"Megatron-LM: training multi-billion parameter language models using model parallelism"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3302424.3303953"},{"key":"ref24","first-page":"559","article-title":"Alpa: automating inter- and intra-operator parallelism for distributed deep learning","volume-title":"Proc 16th USENIX Symp on Operating Systems Design and Implementation","author":"Zheng","year":"2022"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1631\/fitee.1601883"}],"container-title":["Frontiers of Information Technology &amp; Electronic Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1631\/FITEE.2300684.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1631\/FITEE.2300684\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1631\/FITEE.2300684.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,2,21]],"date-time":"2026-02-21T07:54:24Z","timestamp":1771660464000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1631\/FITEE.2300684"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12,27]]},"references-count":25,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2025,1]]}},"alternative-id":["684"],"URL":"https:\/\/doi.org\/10.1631\/fitee.2300684","relation":{},"ISSN":["2095-9184","2095-9230"],"issn-type":[{"value":"2095-9184","type":"print"},{"value":"2095-9230","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,12,27]]},"assertion":[{"value":"10 October 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"17 October 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 December 2024","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"Dongsheng LI is a corresponding expert of\n                      Frontiers of Information Technology & Electronic Engineering\n                      , and he was not involved with the peer review process of this paper. All the authors declare that they have no conflict of interest.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}