{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,19]],"date-time":"2026-03-19T15:25:56Z","timestamp":1773933956856,"version":"3.50.1"},"reference-count":30,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,11,11]],"date-time":"2025-11-11T00:00:00Z","timestamp":1762819200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,11,11]],"date-time":"2025-11-11T00:00:00Z","timestamp":1762819200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100007129","name":"Natural Science Foundation of Shandong Province","doi-asserted-by":"publisher","award":["No. ZR2023LZH010"],"award-info":[{"award-number":["No. ZR2023LZH010"]}],"id":[{"id":"10.13039\/501100007129","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Cluster Comput"],"published-print":{"date-parts":[[2026,2]]},"DOI":"10.1007\/s10586-025-05782-3","type":"journal-article","created":{"date-parts":[[2025,11,11]],"date-time":"2025-11-11T20:27:45Z","timestamp":1762892865000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Local feedback and dynamic adjustment best offset prefetcher in CXL-SSD"],"prefix":"10.1007","volume":"29","author":[{"given":"Shibao","family":"Li","sequence":"first","affiliation":[]},{"given":"Zhou","family":"Yang","sequence":"additional","affiliation":[]},{"given":"Chengzhi","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Yunwu","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Wei","family":"Dou","sequence":"additional","affiliation":[]},{"given":"Xuerong","family":"Cui","sequence":"additional","affiliation":[]},{"given":"Jianhang","family":"Liu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,11,11]]},"reference":[{"key":"5782_CR1","doi-asserted-by":"publisher","first-page":"2393","DOI":"10.1109\/TCAD.2024.3371268","volume":"43","author":"F Zhang","year":"2024","unstructured":"Zhang, F., Sridharan, A., Hwang, W., Xue, F., Tsai, W., Wang, S.X., Fan, D.: On-device continual learning with stt-assisted-sot mram based in-memory computing. IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems 43, 2393\u20132404 (2024)","journal-title":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems"},{"key":"5782_CR2","doi-asserted-by":"publisher","first-page":"1065","DOI":"10.1109\/TCAD.2023.3333754","volume":"43","author":"K Mishty","year":"2023","unstructured":"Mishty, K., Sadi, M.: System and design technology co-optimization of sot-mram for high-performance ai accelerator memory system. IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems 43, 1065\u20131078 (2023)","journal-title":"IEEE Transactions on Computer-Aided Design of Integrated Circuits and Systems"},{"key":"5782_CR3","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1109\/MM.2024.3373763","volume":"44","author":"A Gholami","year":"2024","unstructured":"Gholami, A., Yao, Z., Kim, S., Hooper, C., Mahoney, M.W., Keutzer, K.: Ai and memory wall. IEEE Micro 44, 33\u201339 (2024)","journal-title":"IEEE Micro"},{"issue":"240","key":"5782_CR4","first-page":"1","volume":"24","author":"A Chowdhery","year":"2023","unstructured":"Chowdhery, A., Narang, S., Devlin, J., Bosma, M., Mishra, G., Roberts, A., Barham, P., Chung, H.W., Sutton, C., Gehrmann, S., et al.: Palm: scaling language modeling with pathways. J. Mach. Learn. Res. 24(240), 1\u2013113 (2023)","journal-title":"J. Mach. Learn. Res."},{"key":"5782_CR5","first-page":"1","volume":"10","author":"D Patel","year":"2023","unstructured":"Patel, D., Wong, G.: Gpt-4 architecture, infrastructure, training dataset, costs, vision, moe. Demystifying GPT-4: The Engineering Tradeoffs That Led OpenAI to Their Architecture. SemiAnalysis 10, 1\u201317 (2023)","journal-title":"Demystifying GPT-4: The Engineering Tradeoffs That Led OpenAI to Their Architecture. SemiAnalysis"},{"key":"5782_CR6","unstructured":"Elias, J.: Google\u2019s newest A.I. model uses nearly five times more text data for training than its predecessor. [Online]. https:\/\/www.cnbc.com\/2023\/05\/16\/googles-palm-2-uses-nearly-five-times-more-text-data-than-predecessor.html"},{"key":"5782_CR7","unstructured":"Introducing Llama 3.1: Our most capable models to date. [Online]. https:\/\/ai.meta.com\/blog\/meta-llama-3-1\/"},{"key":"5782_CR8","unstructured":"Nvidia H200 tensor core GPU. [Online]. https:\/\/www.nvidia.com\/en-us\/data-center\/h200\/"},{"key":"5782_CR9","doi-asserted-by":"crossref","unstructured":"Sharma, D.D.: Compute express link\u00ae: an open industry-standard interconnect enabling heterogeneous data-centric computing. In: 2022 IEEE Symposium on High-Performance Interconnects (HOTI), pp. 5\u201312 (2022). IEEE","DOI":"10.1109\/HOTI55740.2022.00017"},{"key":"5782_CR10","doi-asserted-by":"crossref","unstructured":"Jung, M.: Hello bytes, bye blocks: pcie storage meets compute express link for memory expansion (cxl-ssd). In: Proceedings of the 14th ACM Workshop on Hot Topics in Storage and File Systems, pp. 45\u201351 (2022)","DOI":"10.1145\/3538643.3539745"},{"issue":"2","key":"5782_CR11","doi-asserted-by":"publisher","first-page":"20","DOI":"10.1109\/MM.2023.3240774","volume":"43","author":"K Kim","year":"2023","unstructured":"Kim, K., Kim, H., So, J., Lee, W., Im, J., Park, S., Cho, J., Song, H.: Smt: software-defined memory tiering for heterogeneous computing systems with cxl memory expander. IEEE Micro 43(2), 20\u201329 (2023)","journal-title":"IEEE Micro"},{"key":"5782_CR12","doi-asserted-by":"crossref","unstructured":"Lee, K., Kim, S., Lee, J., Moon, D., Kim, R., Kim, H., Ji, H., Mun, Y., Joo, Y.: Improving key-value cache performance with heterogeneous memory tiering: A case study of cxl-based memory expansion. IEEE Micro (2024)","DOI":"10.1109\/MM.2024.3358861"},{"key":"5782_CR13","doi-asserted-by":"crossref","unstructured":"Arif, M., Assogba, K., Rafique, M.M., Vazhkudai, S.: Exploiting cxl-based memory for distributed deep learning. In: Proceedings of the 51st International Conference on Parallel Processing, pp. 1\u201311 (2022)","DOI":"10.1145\/3545008.3545054"},{"key":"5782_CR14","doi-asserted-by":"crossref","unstructured":"Kwon, M., Lee, S., Jung, M.: Cache in hand: expander-driven cxl prefetcher for next generation cxl-ssd. In: Proceedings of the 15th ACM Workshop on Hot Topics in Storage and File Systems, pp. 24\u201330 (2023)","DOI":"10.1145\/3599691.3603406"},{"key":"5782_CR15","unstructured":"Yang, S.-P., Kim, M., Nam, S., Park, J., Choi, J.-Y., Nam, E.H., Lee, E., Lee, S., Kim, B.S.: Overcoming the Memory Wall with CXL-Enabled SSDs. In: 2023 USENIX Annual Technical Conference (USENIX ATC 23), pp. 601\u2013617 (2023)"},{"key":"5782_CR16","doi-asserted-by":"crossref","unstructured":"Michaud, P.: Best-offset hardware prefetching. In: 2016 IEEE International Symposium on High Performance Computer Architecture (HPCA), pp. 469\u2013480 (2016). IEEE","DOI":"10.1109\/HPCA.2016.7446087"},{"key":"5782_CR17","unstructured":"Tavakkol, A., G\u00f3mez-Luna, J., Sadrosadati, M., Ghose, S., Mutlu, O.: MQSim: a framework for enabling realistic studies of modern Multi-Queue SSD devices. In: 16th USENIX Conference on File and Storage Technologies (FAST 18), pp. 49\u201366 (2018)"},{"key":"5782_CR18","unstructured":"Xiang, L., Lin, Z., Deng, W., Lu, H., Rao, J., Yuan, Y., Wang, R.: Nomad: Non-Exclusive Memory Tiering via Transactional Page Migration. In: 18th USENIX Symposium on Operating Systems Design and Implementation (OSDI 24), pp. 19\u201335 (2024)"},{"key":"5782_CR19","doi-asserted-by":"crossref","unstructured":"Ham, H., Hong, J., Park, G., Shin, Y., Woo, O., Yang, W., Bae, J., Park, E., Sung, H., Lim, E., et al.: Low-overhead general-purpose near-data processing in cxl memory expanders. arXiv preprint arXiv:2404.19381 (2024)","DOI":"10.1109\/MICRO61859.2024.00051"},{"key":"5782_CR20","unstructured":"Zhou, Z., Chen, Y., Zhang, T., Wang, Y., Shu, R., Xu, S., Cheng, P., Qu, L., Xiong, Y., Sun, G.: Toward cxl-native memory tiering via device-side profiling. arXiv preprint arXiv:2403.18702 (2024)"},{"key":"5782_CR21","doi-asserted-by":"crossref","unstructured":"Gouk, D., Kang, S., Bae, H., Ryu, E., Lee, S., Kim, D., Jang, J., Jung, M.: Breaking barriers: expanding gpu memory with sub-two digit nanosecond latency cxl controller. In: Proceedings of the 16th ACM Workshop on Hot Topics in Storage and File Systems, pp. 108\u2013115 (2024)","DOI":"10.1145\/3655038.3665953"},{"key":"5782_CR22","doi-asserted-by":"crossref","unstructured":"Abdullah, R., Lee, H., Zhou, H., Awad, A.: Salus: efficient security support for cxl-expanded gpu memory. In: 2024 IEEE International Symposium on High-Performance Computer Architecture (HPCA), pp. 1\u201315 (2024). IEEE","DOI":"10.1109\/HPCA57654.2024.00027"},{"key":"5782_CR23","doi-asserted-by":"crossref","unstructured":"Ahn, M., Chang, A., Lee, D., Gim, J., Kim, J., Jung, J., Rebholz, O., Pham, V., Malladi, K., Ki, Y.S.: Enabling cxl memory expansion for in-memory database management systems. In: Proceedings of the 18th International Workshop on Data Management on New Hardware, pp. 1\u20135 (2022)","DOI":"10.1145\/3533737.3535090"},{"key":"5782_CR24","doi-asserted-by":"publisher","DOI":"10.14778\/3685800.3685809","author":"M Ahn","year":"2024","unstructured":"Ahn, M., Willhalm, T., May, N., Lee, D., Desai, S.M., Booss, D., Kim, J., Singh, N., Ritter, D., Rebholz, O.: An examination of cxl memory use cases for in-memory database management systems using sap hana. Proc. VLDB Endow (2024). https:\/\/doi.org\/10.14778\/3685800.3685809","journal-title":"Proc. VLDB Endow"},{"key":"5782_CR25","unstructured":"Lee, S., Lerner, A., Bonnet, P., Cudr\u00e9-Mauroux, P.: Database kernels: Seamless integration of database systems and fast storage via cxl. In: CIDR (2024)"},{"key":"5782_CR26","unstructured":"TensorFlow code and pre-trained models for BERT. [Online]. https:\/\/github.com\/google-research\/bert"},{"key":"5782_CR27","unstructured":"XZ utils. [Online]. https:\/\/www.tukaani.org\/xz\/"},{"key":"5782_CR28","unstructured":"GAP benchmark suite. [Online]. https:\/\/github.com\/ sbeamer\/gapbs"},{"key":"5782_CR29","unstructured":"Al\u00a0Maruf, H., Chowdhury, M.: Effectively prefetching remote memory with leap. In: 2020 USENIX Annual Technical Conference (USENIX ATC 20), pp. 843\u2013857 (2020)"},{"key":"5782_CR30","doi-asserted-by":"crossref","unstructured":"Srinath, S., Mutlu, O., Kim, H., Patt, Y.N.: Feedback directed prefetching: improving the performance and bandwidth-efficiency of hardware prefetchers. In: 2007 IEEE 13th International Symposium on High Performance Computer Architecture,\u00a0IEEE, pp. 63\u201374 (2007).\u00a0","DOI":"10.1109\/HPCA.2007.346185"}],"container-title":["Cluster Computing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10586-025-05782-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10586-025-05782-3","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10586-025-05782-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,19]],"date-time":"2026-03-19T13:08:37Z","timestamp":1773925717000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10586-025-05782-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,11]]},"references-count":30,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2026,2]]}},"alternative-id":["5782"],"URL":"https:\/\/doi.org\/10.1007\/s10586-025-05782-3","relation":{},"ISSN":["1386-7857","1573-7543"],"issn-type":[{"value":"1386-7857","type":"print"},{"value":"1573-7543","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,11,11]]},"assertion":[{"value":"1 March 2025","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"14 May 2025","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 September 2025","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 November 2025","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no competing interests.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"18"}}