{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,10]],"date-time":"2025-10-10T01:23:43Z","timestamp":1760059423336,"version":"build-2065373602"},"publisher-location":"New York, NY, USA","reference-count":22,"publisher":"ACM","funder":[{"name":"JHPCN","award":["jh251003"],"award-info":[{"award-number":["jh251003"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,10,12]]},"DOI":"10.1145\/3725783.3764411","type":"proceedings-article","created":{"date-parts":[[2025,10,9]],"date-time":"2025-10-09T17:50:12Z","timestamp":1760032212000},"page":"61-67","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Chimera-VDB: Mixed-Precision Vector Database with HNSW Index for RAG-LLM"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0006-9482-719X","authenticated-orcid":false,"given":"Naoshi","family":"Yamane","sequence":"first","affiliation":[{"name":"Tohoku University, Sendai, Miyagi, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0996-0051","authenticated-orcid":false,"given":"Michael Ryan","family":"Zielewski","sequence":"additional","affiliation":[{"name":"Tohoku University, Sendai, Miyagi, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-1917-2742","authenticated-orcid":false,"given":"Takaki","family":"Nakamura","sequence":"additional","affiliation":[{"name":"Tohoku University, Sendai, Miyagi, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5798-5125","authenticated-orcid":false,"given":"Takuo","family":"Suganuma","sequence":"additional","affiliation":[{"name":"Tohoku University, Sendai, Miyagi, Japan"}]}],"member":"320","published-online":{"date-parts":[[2025,10,11]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"RAG makes LLMs better and equal. (Jan","author":"Catav Amnon","year":"2024","unstructured":"Amnon Catav, Roy Miara, Ilai Giloh, Nathan Cordeiro, and Amir Ingber. 2024. RAG makes LLMs better and equal. (Jan. 2024). Retrieved Jun 3, 2025 from https:\/\/www.pinecone.io\/blog\/rag-study\/."},{"key":"e_1_3_2_1_2_1","volume-title":"International Conference on ICT Innovations. Springer, 3\u201318","author":"Filipovska Elena","year":"2024","unstructured":"Elena Filipovska, Ana Mladenovska, Jovana Dobreva, Dimitar Kitanovski, Goran Mitrov, Petre Lameski, and Eftim Zdravevski. 2024. Evaluation of vector databases and LLMs in RAG-based multi-document question answering. In International Conference on ICT Innovations. Springer, 3\u201318."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/3654970"},{"key":"e_1_3_2_1_4_1","volume-title":"International Conference on Machine Learning. https:\/\/arxiv.org\/abs\/1908","author":"Guo Ruiqi","year":"2020","unstructured":"Ruiqi Guo, Philip Sun, Erik Lindgren, Quan Geng, David Simcha, Felix Chern, and Sanjiv Kumar. 2020. Accelerating large-scale inference with anisotropic vector quantization. In International Conference on Machine Learning. https:\/\/arxiv.org\/abs\/1908.10396."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00286"},{"key":"e_1_3_2_1_6_1","volume-title":"Ravishankar Krishnawamy, and Rohan Kadekodi.","author":"Subramanya Suhas Jayaram","year":"2019","unstructured":"Suhas Jayaram Subramanya, Fnu Devvrit, Harsha Vardhan Simhadri, Ravishankar Krishnawamy, and Rohan Kadekodi. 2019. Diskann: fast accurate billion-point nearest neighbor search on a single node. Advances in neural information processing Systems, 32."},{"key":"e_1_3_2_1_7_1","volume-title":"Product quantization for nearest neighbor search","author":"Jegou Herve","unstructured":"Herve Jegou, Matthijs Douze, and Cordelia Schmid. 2010. Product quantization for nearest neighbor search. IEEE transactions on pattern analysis and machine intelligence, 33, 1, 117\u2013128."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2011.5946540"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA61862.2024.00156"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"crossref","unstructured":"Chao Jin Zili Zhang Xuanlin Jiang Fangyue Liu Xin Liu Xuanzhe Liu and Xin Jin. 2024. RAGCache: Efficient knowledge caching for retrieval-augmented generation. arXiv preprint arXiv:2404.12457.","DOI":"10.1145\/3768628"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/AIxMM62960.2025.00008"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1145\/3184558.3192301"},{"key":"e_1_3_2_1_13_1","volume-title":"Efficient and robust approximate nearest neighbor search using hierarchical navigable small world graphs","author":"Malkov Yu A","unstructured":"Yu A Malkov and Dmitry A Yashunin. 2018. Efficient and robust approximate nearest neighbor search using hierarchical navigable small world graphs. IEEE transactions on pattern analysis and machine intelligence, 42, 4, 824\u2013836."},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCT-Pacific63901.2025.11012786"},{"key":"e_1_3_2_1_15_1","volume-title":"Retrieved","year":"2025","unstructured":"Microsoft. 2025. (2025). Retrieved Aug, 2025 from https:\/\/github.com\/microsoft\/SPTAG\/tree\/main\/datasets\/SPACEV1B."},{"key":"e_1_3_2_1_16_1","volume-title":"Retrieved","year":"2025","unstructured":"OpenSearch. 2025. (2025). Retrieved May 28, 2025 from https:\/\/opensearch.org\/."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00778-024-00864-x"},{"key":"e_1_3_2_1_18_1","volume-title":"Retrieved","year":"2025","unstructured":"Qdrant. 2025. (2025). Retrieved May 28, 2025 from https:\/\/qdrant.tech\/."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"crossref","unstructured":"Toyotaro Suzumura et al. 2022. mdx: A cloud platform for supporting data science and cross-disciplinary research collaborations. In 2022 IEEE Intl Conf on Dependable Autonomic and Secure Computing Intl Conf on Pervasive Intelligence and Computing Intl Conf on Cloud and Big Data Computing Intl Conf on Cyber Science and Technology Congress (DASC\/PiCom\/CBDCom\/CyberSciTech). IEEE 1\u20137.","DOI":"10.1109\/DASC\/PiCom\/CBDCom\/Cy55231.2022.9927822"},{"key":"e_1_3_2_1_20_1","unstructured":"Liang Wang Nan Yang Xiaolong Huang Linjun Yang Rangan Majumder and Furu Wei. 2024. Multilingual e5 text embeddings: A technical report. arXiv preprint arXiv:2402.05672."},{"key":"e_1_3_2_1_21_1","volume-title":"Retrieved","year":"2025","unstructured":"Weaviate. 2025. (2025). Retrieved May 28, 2025 from https:\/\/weaviate.io\/."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"crossref","unstructured":"Hailin Zhang Penghao Zhao Xupeng Miao Yingxia Shao Zirui Liu Tong Yang and Bin Cui. 2023. Experimental analysis of large-scale learnable vector storage compression. arXiv preprint arXiv:2311.15578.","DOI":"10.14778\/3636218.3636234"}],"event":{"name":"APSys '25: 16th ACM SIGOPS Asia-Pacific Workshop on Systems","location":"Lotte Hotel World, Emerald Hall Seoul Republic of Korea","acronym":"APSys '25","sponsor":["SIGOPS ACM Special Interest Group on Operating Systems"]},"container-title":["Proceedings of the 16th ACM SIGOPS Asia-Pacific Workshop on Systems"],"original-title":[],"deposited":{"date-parts":[[2025,10,9]],"date-time":"2025-10-09T17:52:35Z","timestamp":1760032355000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3725783.3764411"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,11]]},"references-count":22,"alternative-id":["10.1145\/3725783.3764411","10.1145\/3725783"],"URL":"https:\/\/doi.org\/10.1145\/3725783.3764411","relation":{},"subject":[],"published":{"date-parts":[[2025,10,11]]},"assertion":[{"value":"2025-10-11","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}