{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T05:05:29Z","timestamp":1750309529720,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":16,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,7,5]],"date-time":"2024-07-05T00:00:00Z","timestamp":1720137600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,7,5]]},"DOI":"10.1145\/3705956.3705968","type":"proceedings-article","created":{"date-parts":[[2024,12,28]],"date-time":"2024-12-28T11:29:57Z","timestamp":1735385397000},"page":"18-23","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Enhancing HyperAttention: A Novel Approach for Improved Algorithmic Efficiency"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-1259-756X","authenticated-orcid":false,"given":"Xinyi","family":"Xie","sequence":"first","affiliation":[{"name":"Faculty of Science and Technology, Beijing Normal University-Hong Kong Baptist University United International College, Zhuhai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-4383-6374","authenticated-orcid":false,"given":"Yi","family":"Ding","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, Xiamen University Tan Kan Kee College, Zhangzhou, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-3426-8219","authenticated-orcid":false,"given":"Chao","family":"Jiang","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Dongguan University of Technology, Dongguan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-1109-5975","authenticated-orcid":false,"given":"Tianyi","family":"Hang","sequence":"additional","affiliation":[{"name":"School of Information Science and Technology, Xi'an Jiaotong University, Xi'an, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0006-9672-9307","authenticated-orcid":false,"given":"Tianrun","family":"Lu","sequence":"additional","affiliation":[{"name":"Jinling College, Nanjing University, Heibei, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2024,12,28]]},"reference":[{"key":"e_1_3_3_1_1_2","volume-title":"Efficient large language models: A survey[J]. arXiv preprint arXiv:2312.03863","author":"Wan Z","year":"2023","unstructured":"Wan Z, Wang X, Liu C, et al. Efficient large language models: A survey[J]. arXiv preprint arXiv:2312.03863, 2023, 1."},{"key":"e_1_3_3_1_2_2","volume-title":"The Twelfth International Conference on Learning Representations","author":"Insu Han","year":"2024","unstructured":"Insu Han, Rajesh Jayaram, Amin Karbasi, Vahab Mirrokni, David Woodruff, and Amir Zandieh. Hyperattention: Long-context attention in near-linear time. In The Twelfth International Conference on Learning Representations, 2024."},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"publisher","DOI":"10.1145\/276698.276876"},{"volume-title":"Vldb.","author":"Gionis","key":"e_1_3_3_1_4_2","unstructured":"Gionis, Aristides, Piotr Indyk, and Rajeev Motwani. \u201dSimilarity search in high dimensions via hashing.\u201d Vldb. Vol. 99. No. 6. 1999. https:\/\/dl.acm.org\/doi\/10.5555\/645925.671516"},{"key":"e_1_3_3_1_5_2","volume-title":"Attention is all you need.\u00a0Advances in Neural Information Processing Systems","author":"Vaswani A.","year":"2017","unstructured":"Vaswani, A. (2017). Attention is all you need.\u00a0Advances in Neural Information Processing Systems."},{"key":"e_1_3_3_1_6_2","volume-title":"Linformer: Self-attention with linear complexity.\u00a0arXiv preprint arXiv:2006.04768","author":"Wang S.","year":"2020","unstructured":"Wang, S., Li, B. Z., Khabsa, M., Fang, H., & Ma, H. (2020). Linformer: Self-attention with linear complexity.\u00a0arXiv preprint arXiv:2006.04768."},{"key":"e_1_3_3_1_7_2","volume-title":"Reformer: The efficient transformer.\u00a0arXiv preprint arXiv:2001.04451","author":"Kitaev N.","year":"2020","unstructured":"Kitaev, N., Kaiser, \u0141., & Levskaya, A. (2020). Reformer: The efficient transformer.\u00a0arXiv preprint arXiv:2001.04451."},{"key":"e_1_3_3_1_8_2","volume-title":"Longformer: The long-document transformer.\u00a0arXiv preprint arXiv:2004.05150","author":"Beltagy I.","year":"2020","unstructured":"Beltagy, I., Peters, M. E., & Cohan, A. (2020). Longformer: The long-document transformer.\u00a0arXiv preprint arXiv:2004.05150."},{"key":"e_1_3_3_1_9_2","volume-title":"Big bird: Transformers for longer sequences.\u00a0Advances in neural information processing systems,\u00a033, 17283-17297","author":"Zaheer M.","year":"2020","unstructured":"Zaheer, M., Guruganesh, G., Dubey, K. A., Ainslie, J., Alberti, C., Ontanon, S., ... & Ahmed, A. (2020). Big bird: Transformers for longer sequences.\u00a0Advances in neural information processing systems,\u00a033, 17283-17297."},{"key":"e_1_3_3_1_10_2","volume-title":"Rethinking attention with performers.\u00a0arXiv preprint arXiv:2009.14794","author":"Choromanski K.","year":"2020","unstructured":"Choromanski, K., Likhosherstov, V., Dohan, D., Song, X., Gane, A., Sarlos, T., ... & Weller, A. (2020). Rethinking attention with performers.\u00a0arXiv preprint arXiv:2009.14794."},{"key":"e_1_3_3_1_11_2","volume-title":"Flashattention: Fast and memory-efficient exact attention with io-awareness.\u00a0Advances in Neural Information Processing Systems,\u00a035, 16344-16359","author":"Dao T.","year":"2022","unstructured":"Dao, T., Fu, D., Ermon, S., Rudra, A., & R\u00e9, C. (2022). Flashattention: Fast and memory-efficient exact attention with io-awareness.\u00a0Advances in Neural Information Processing Systems,\u00a035, 16344-16359."},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781107298019"},{"key":"e_1_3_3_1_13_2","volume-title":"Some methods for classification and analysis of multivariate observations. In\u00a0Proceedings of 5-th Berkeley Symposium on Mathematical Statistics and Probability\/University of California Press","author":"MacQueen J.","year":"1967","unstructured":"MacQueen, J. (1967). Some methods for classification and analysis of multivariate observations. In\u00a0Proceedings of 5-th Berkeley Symposium on Mathematical Statistics and Probability\/University of California Press."},{"key":"e_1_3_3_1_14_2","doi-asserted-by":"crossref","unstructured":"Hartigan John A. and Manchek A. Wong. \u201dAlgorithm AS 136: A k-means clustering algorithm.\u201d Journal of the Royal Statistical Society. series c (applied statistics) 28.1 (1979): 100-108.","DOI":"10.2307\/2346830"},{"key":"e_1_3_3_1_15_2","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781107298019"},{"key":"e_1_3_3_1_16_2","volume-title":"Attention is Naturally Sparse with Gaussian Distributed Input.\u00a0arXiv preprint arXiv:2404.02690","author":"Deng Y.","year":"2024","unstructured":"Deng, Y., Song, Z., & Yang, C. Attention is Naturally Sparse with Gaussian Distributed Input.\u00a0arXiv preprint arXiv:2404.02690, 2024."}],"event":{"name":"HPCCT 2024: 2024 8th High Performance Computing and Cluster Technologies Conference (HPCCT)","acronym":"HPCCT 2024","location":"Beijing China"},"container-title":["Proceedings of the 2024 8th High Performance Computing and Cluster Technologies Conference"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3705956.3705968","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3705956.3705968","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:18:13Z","timestamp":1750295893000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3705956.3705968"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7,5]]},"references-count":16,"alternative-id":["10.1145\/3705956.3705968","10.1145\/3705956"],"URL":"https:\/\/doi.org\/10.1145\/3705956.3705968","relation":{},"subject":[],"published":{"date-parts":[[2024,7,5]]},"assertion":[{"value":"2024-12-28","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}