{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T14:03:16Z","timestamp":1774879396133,"version":"3.50.1"},"publisher-location":"Singapore","reference-count":38,"publisher":"Springer Nature Singapore","isbn-type":[{"value":"9789819584130","type":"print"},{"value":"9789819584147","type":"electronic"}],"license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-981-95-8414-7_25","type":"book-chapter","created":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T13:15:02Z","timestamp":1774876502000},"page":"447-466","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["DiffGen: Optimizing I\/O Trace Generation with\u00a0Differentiated Modeling Techniques"],"prefix":"10.1007","author":[{"given":"Jian","family":"Liu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhiyang","family":"Feng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ziguang","family":"Fu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Guodao","family":"Sun","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yilong","family":"Zhang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nan","family":"Gao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ronghua","family":"Liang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Peng","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Li","family":"Jiang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2026,3,31]]},"reference":[{"issue":"4","key":"25_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2078861.2078864","volume":"7","author":"DT Meyer","year":"2012","unstructured":"Meyer, D.T., Bolosky, W.J.: A study of practical deduplication. ACM Trans. Storage (ToS) 7(4), 1\u201320 (2012)","journal-title":"ACM Trans. Storage (ToS)"},{"key":"25_CR2","unstructured":"Ding, X., Jiang, S., Chen, F., et al.: DiskSeen: exploiting disk layout and access history to enhance I\/O prefetch. In: USENIX Annual Technical Conference, pp. 261\u2013274 (2007)"},{"key":"25_CR3","unstructured":"Ousterhout, A., Fried, J., Behrens, J., et al.: Shenango: achieving high CPU efficiency for latency-sensitive datacenter workloads. In: 16th USENIX Symposium on Networked Systems Design and Implementation (NSDI 2019), pp. 361\u2013378 (2019)"},{"key":"25_CR4","doi-asserted-by":"crossref","unstructured":"Sharma, B., Jayachandran, P., Verma, A., et al.: CloudPD: problem determination and diagnosis in shared dynamic clouds. In: 2013 43rd Annual IEEE\/IFIP International Conference on Dependable Systems and Networks (DSN), pp. 1\u201312. IEEE (2013)","DOI":"10.1109\/DSN.2013.6575298"},{"key":"25_CR5","doi-asserted-by":"crossref","unstructured":"Li, B., Toussi, F., Anderson, C., et al.: Tracerar: an I\/O performance evaluation tool for replaying, analyzing, and regenerating traces. In: 2017 International Conference on Networking, Architecture, and Storage (NAS), pp. 1\u201310. IEEE (2017)","DOI":"10.1109\/NAS.2017.8026880"},{"key":"25_CR6","doi-asserted-by":"crossref","unstructured":"Sabnis, A., Sitaraman, R.K.: TRAGEN: a synthetic trace generator for realistic cache simulations. In: Proceedings of the 21st ACM Internet Measurement Conference, pp. 366\u2013379 (2021)","DOI":"10.1145\/3487552.3487845"},{"key":"25_CR7","doi-asserted-by":"crossref","unstructured":"Sabnis, A., Sitaraman, R.K.: JEDI: model-driven trace generation for cache simulations. In: Proceedings of the 22nd ACM Internet Measurement Conference, pp. 679\u2013693 (2022)","DOI":"10.1145\/3517745.3561466"},{"key":"25_CR8","doi-asserted-by":"crossref","unstructured":"Zhang, H., Yang, Z., Xie, Y., et al.: Accurate generation of I\/O workloads using generative adversarial networks. In: 2024 International Conference on Networking, Architecture and Storage (NAS), pp. 1\u20139. IEEE (2024)","DOI":"10.1109\/NAS63802.2024.10781347"},{"key":"25_CR9","doi-asserted-by":"crossref","unstructured":"Huang, K., Li, X., Yuan, M., et al.: Joint directory, file and IO trace feature extraction and feature-based trace regeneration for enterprise storage systems. In: 2024 IEEE 40th International Conference on Data Engineering (ICDE), pp. 4002\u20134015. IEEE (2024)","DOI":"10.1109\/ICDE60146.2024.00307"},{"key":"25_CR10","doi-asserted-by":"crossref","unstructured":"Sundarrajan, A., Feng, M., Kasbekar, M., et al.: Footprint descriptors: theory and practice of cache provisioning in a global CDN. In: Proceedings of the 13th International Conference on Emerging Networking Experiments and Technologies, pp. 55\u201367 (2017)","DOI":"10.1145\/3143361.3143368"},{"key":"25_CR11","doi-asserted-by":"crossref","unstructured":"LeCun, Y., Bottou, L., Orr, G.B., et al.: Efficient backprop. In: Neural Networks: Tricks of the Trade, pp. 9\u201350. Springer, Heidelberg (2002)","DOI":"10.1007\/3-540-49430-8_2"},{"issue":"1","key":"25_CR12","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman, L.: Random forests. Mach. Learn. 45(1), 5\u201332 (2001)","journal-title":"Mach. Learn."},{"key":"25_CR13","doi-asserted-by":"crossref","unstructured":"Breiman, L., Friedman, J., Olshen, R.A., et al.: Classification and Regression Trees. Routledge (2017)","DOI":"10.1201\/9781315139470"},{"issue":"3","key":"25_CR14","doi-asserted-by":"publisher","first-page":"273","DOI":"10.1023\/A:1022627411411","volume":"20","author":"C Cortes","year":"1995","unstructured":"Cortes, C., Vapnik, V.: Support-vector networks. Mach. Learn. 20(3), 273\u2013297 (1995)","journal-title":"Mach. Learn."},{"issue":"1","key":"25_CR15","doi-asserted-by":"publisher","first-page":"21","DOI":"10.1109\/TIT.1967.1053964","volume":"13","author":"T Cover","year":"1967","unstructured":"Cover, T., Hart, P.: Nearest neighbor pattern classification. IEEE Trans. Inf. Theory 13(1), 21\u201327 (1967)","journal-title":"IEEE Trans. Inf. Theory"},{"key":"25_CR16","unstructured":"Duda, R.O., Hart, P.E.: Pattern Classification and Scene Analysis. Wiley-Interscience (1973)"},{"key":"25_CR17","unstructured":"Virtanen, P., Gommers, R., Oliphant, T.E., et al.: SciPy 1.0: fundamental algorithms for scientific computing in Python. Nat. Methods 17(3), 261\u2013272 (2020)"},{"key":"25_CR18","unstructured":"Talwadker, R., Voruganti, K.: ParaSwift: file I\/O trace modeling for the future. In: 28th Large Installation System Administration Conference (LISA 2014), pp. 128\u2013141 (2014)"},{"key":"25_CR19","unstructured":"Kingma, D.P., Ba, J.: Adam: a method for stochastic optimization. arXiv preprint arXiv:1412.6980 (2014)"},{"key":"25_CR20","unstructured":"Goodfellow, I., Bengio, Y., Courville, A.: Deep Learning. MIT Press (2016)"},{"key":"25_CR21","doi-asserted-by":"crossref","unstructured":"Gretton, A., Borgwardt, K., Rasch, M., et al.: A kernel method for the two-sample-problem. In: Advances in Neural Information Processing Systems, pp. 513\u2013520 (2006)","DOI":"10.7551\/mitpress\/7503.003.0069"},{"issue":"4","key":"25_CR22","doi-asserted-by":"publisher","first-page":"679","DOI":"10.1016\/j.ijforecast.2006.03.001","volume":"22","author":"RJ Hyndman","year":"2006","unstructured":"Hyndman, R.J., Koehler, A.B.: Another look at measures of forecast accuracy. Int. J. Forecast. 22(4), 679\u2013688 (2006)","journal-title":"Int. J. Forecast."},{"key":"25_CR23","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-14142-8","volume-title":"Data Mining: The Textbook","author":"CC Aggarwal","year":"2015","unstructured":"Aggarwal, C.C.: Data Mining: The Textbook. Springer, New York (2015)"},{"issue":"1","key":"25_CR24","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3423137","volume":"17","author":"G Yadgar","year":"2021","unstructured":"Yadgar, G., Gabel, M., Jaffer, S., et al.: SSD-based workload characteristics and their performance implications. ACM Trans. Storage (TOS) 17(1), 1\u201326 (2021)","journal-title":"ACM Trans. Storage (TOS)"},{"key":"25_CR25","unstructured":"Wong, D.L.K., Wu, H., Molder, C., et al.: Baleen: ML admission & prefetching for flash caches. In: 22nd USENIX Conference on File and Storage Technologies (FAST 2024), pp. 347\u2013371 (2024)"},{"key":"25_CR26","doi-asserted-by":"crossref","unstructured":"Lee, C., Kumano, T., Matsuki, T., et al.: Understanding storage traffic characteristics on enterprise virtual desktop infrastructure. In: Proceedings of the 10th ACM International Systems and Storage Conference, pp. 1\u201311 (2017)","DOI":"10.1145\/3078468.3078479"},{"key":"25_CR27","doi-asserted-by":"publisher","DOI":"10.1016\/j.softx.2024.102018","volume":"29","author":"J Liu","year":"2025","unstructured":"Liu, J., Chen, Y., Ding, H.: CacheSim: a cache simulation framework for evaluating caching algorithms on resource-constrained edge devices. SoftwareX 29, 102018 (2025)","journal-title":"SoftwareX"},{"key":"25_CR28","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., et al.: Attention is all you need. In: Advances in Neural Information Processing Systems. MIT Press (2017)"},{"issue":"8","key":"25_CR29","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J.: Long short-term memory. Neural Comput. 9(8), 1735\u20131780 (1997). https:\/\/doi.org\/10.1162\/neco.1997.9.8.1735","journal-title":"Neural Comput."},{"key":"25_CR30","doi-asserted-by":"crossref","unstructured":"Rumelhart, D.E., McClelland, J.L.: Learning internal representations by error propagation. In: Parallel Distributed Processing: Explorations in the Microstructure of Cognition: Foundations, pp. 318\u2013362. MIT Press (1987)","DOI":"10.7551\/mitpress\/4943.003.0128"},{"key":"25_CR31","unstructured":"Haghdoost, A., He, W., Fredin, J., et al.: On the accuracy and scalability of intensive I\/O workload replay. In: 15th USENIX Conference on File and Storage Technologies (FAST 2017), pp. 315\u2013328 (2017)"},{"key":"25_CR32","doi-asserted-by":"crossref","unstructured":"Sajal, S.M., Zhu, T., Urgaonkar, B., et al.: Traceupscaler: upscaling traces to evaluate systems at high load. In: Proceedings of the Nineteenth European Conference on Computer Systems, pp. 942\u2013961 (2024)","DOI":"10.1145\/3627703.3629581"},{"key":"25_CR33","doi-asserted-by":"crossref","unstructured":"Sajal, S.M., Estyak, M.S., Hasan, R., et al.: TraceScaler: a framework for scaling load in real-world traces for system evaluation. ACM Trans. Comput. Syst. (2025)","DOI":"10.1145\/3760774"},{"key":"25_CR34","doi-asserted-by":"crossref","unstructured":"Anand, V., Stolet, M., Mace, J., et al.: Generating representative macrobenchmark microservice systems from distributed traces with Palette. arXiv preprint arXiv:2506.06448 (2025)","DOI":"10.1145\/3725783.3764387"},{"key":"25_CR35","doi-asserted-by":"crossref","unstructured":"Li, C., Wei, J., Xie, H., et al.: TraceGen: a block-level storage system performance evaluation tool for analyzing and generating I\/O traces. In: 2024 IEEE International Conference on High Performance Computing and Communications (HPCC), pp. 152\u2013159. IEEE (2024)","DOI":"10.1109\/HPCC64274.2024.00030"},{"key":"25_CR36","doi-asserted-by":"crossref","unstructured":"Muttillo, V., Di Sipio, C., Rubei, R., et al.: Towards synthetic trace generation of modeling operations using in-context learning approach. In: Proceedings of the 39th IEEE\/ACM International Conference on Automated Software Engineering, pp. 619\u2013630 (2024)","DOI":"10.1145\/3691620.3695058"},{"key":"25_CR37","doi-asserted-by":"crossref","unstructured":"Kim, D., Ravula, S., Ha, T., et al.: Large language models as realistic microservice trace generators. arXiv preprint arXiv:2502.17439 (2024)","DOI":"10.18653\/v1\/2025.emnlp-main.4"},{"key":"25_CR38","doi-asserted-by":"crossref","unstructured":"Paul, A.K., Choi, J.Y., Karimi, A.M., et al.: Machine learning assisted HPC workload trace generation for leadership scale storage systems. In: Proceedings of the 31st International Symposium on High-Performance Parallel and Distributed Computing, pp. 199\u2013212 (2022)","DOI":"10.1145\/3502181.3531457"}],"container-title":["Lecture Notes in Computer Science","Algorithms and Architectures for Parallel Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-95-8414-7_25","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,30]],"date-time":"2026-03-30T13:15:09Z","timestamp":1774876509000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-95-8414-7_25"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"ISBN":["9789819584130","9789819584147"],"references-count":38,"URL":"https:\/\/doi.org\/10.1007\/978-981-95-8414-7_25","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]},"assertion":[{"value":"31 March 2026","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICA3PP","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Algorithms and Architectures for Parallel Processing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Zhengzhou","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"30 October 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2 November 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"25","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ica3pp2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/ieee-cybermatics.org\/2025\/ica3pp\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}