{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,2]],"date-time":"2025-08-02T16:26:29Z","timestamp":1754151989817,"version":"3.41.2"},"publisher-location":"New York, NY, USA","reference-count":7,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,5,28]]},"DOI":"10.1145\/3719276.3727954","type":"proceedings-article","created":{"date-parts":[[2025,7,4]],"date-time":"2025-07-04T05:00:46Z","timestamp":1751605246000},"page":"224-225","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["POSTER: V-Seek: Optimizing LLM Reasoning on A Server-Class General-Purpose RISC-V Platform"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-3115-3464","authenticated-orcid":false,"given":"Javier Jesus","family":"Poveda Rodrigo","sequence":"first","affiliation":[{"name":"Politecnico di Torino, Turin, Italy"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-0539-5007","authenticated-orcid":false,"given":"Mohamed Amine","family":"Hamdi","sequence":"additional","affiliation":[{"name":"Politecnico di Torino, Turin, Italy"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-9771-1691","authenticated-orcid":false,"given":"Cyril","family":"Koenig","sequence":"additional","affiliation":[{"name":"ETH Z\u00fcrich, Zurich, Switzerland"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6215-8220","authenticated-orcid":false,"given":"Alessio","family":"Burrello","sequence":"additional","affiliation":[{"name":"Politecnico di Torino, Turin, Italy"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2872-7071","authenticated-orcid":false,"given":"Daniele","family":"Jahier Pagliari","sequence":"additional","affiliation":[{"name":"Politecnico di Torino, Turin, Italy"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8068-3806","authenticated-orcid":false,"given":"Luca","family":"Benini","sequence":"additional","affiliation":[{"name":"ETH Z\u00fcrich, Zurich, Switzerland"}]}],"member":"320","published-online":{"date-parts":[[2025,7,4]]},"reference":[{"doi-asserted-by":"crossref","unstructured":"Nick Brown and Maurice Jamieson. 2024. Performance characterisation of the 64-core SG2042 RISC-V CPU for HPC. arxiv:https:\/\/arXiv.org\/abs\/2406.12394\u00a0[cs.DC]","key":"e_1_3_3_1_2_2","DOI":"10.1007\/978-3-031-73716-9_25"},{"key":"e_1_3_3_1_3_2","volume-title":"ICPP \u201922","author":"al. Jiazhi\u00a0Jiang et","year":"2023","unstructured":"Jiazhi\u00a0Jiang et al.2023. Characterizing and Optimizing Transformer Inference on ARM Many-core Processor. In ICPP \u201922 (Bordeaux, France). Article 20, 11\u00a0pages."},{"unstructured":"Tommaso\u00a0Pegolotti et al.2023. QIGen: Generating Efficient Kernels for Quantized Inference on Large Language Models. arxiv:https:\/\/arXiv.org\/abs\/2307.03738\u00a0[cs.LG]","key":"e_1_3_3_1_4_2"},{"unstructured":"Zhihang\u00a0Yuan et al.2024. LLM Inference Unveiled: Survey and Roofline Model Insights. arxiv:https:\/\/arXiv.org\/abs\/2402.16363\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/2402.16363","key":"e_1_3_3_1_5_2"},{"doi-asserted-by":"publisher","key":"e_1_3_3_1_6_2","DOI":"10.1145\/3650200.3656620"},{"unstructured":"Georgi Gerganov. 2025. llama.cpp. https:\/\/github.com\/ggerganov\/llama.cpp.","key":"e_1_3_3_1_7_2"},{"key":"e_1_3_3_1_8_2","volume-title":"RISC-V Summit Europe","author":"Wang Chiyo","year":"2024","unstructured":"Chiyo Wang. 2024. PerfXLM: A LLM Inference Engine on RISC-V CPUs. In RISC-V Summit Europe. Presented at the RISC-V Summit Europe 2024."}],"event":{"sponsor":["SIGMICRO ACM Special Interest Group on Microarchitectural Research and Processing"],"acronym":"CF '25","name":"CF '25: 22nd ACM International Conference on Computing Frontiers","location":"Cagliari Italy"},"container-title":["Proceedings of the 22nd ACM International Conference on Computing Frontiers"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3719276.3727954","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,21]],"date-time":"2025-07-21T09:48:36Z","timestamp":1753091316000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3719276.3727954"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,28]]},"references-count":7,"alternative-id":["10.1145\/3719276.3727954","10.1145\/3719276"],"URL":"https:\/\/doi.org\/10.1145\/3719276.3727954","relation":{},"subject":[],"published":{"date-parts":[[2025,5,28]]},"assertion":[{"value":"2025-07-04","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}