{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T02:10:02Z","timestamp":1755915002518,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":20,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,10,2]],"date-time":"2023-10-02T00:00:00Z","timestamp":1696204800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Los Alamos National Laboratory is managed by Triad National Security, LLC, for the National Nuclear Security Administration of the U.S. DOE under contract 89233218CNA000001. This work is partially supported by Triad National Security, LLC subcontract \\#581326.","award":["89233218CNA000001"],"award-info":[{"award-number":["89233218CNA000001"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,10,2]]},"DOI":"10.1145\/3631882.3631891","type":"proceedings-article","created":{"date-parts":[[2024,4,8]],"date-time":"2024-04-08T12:06:58Z","timestamp":1712578018000},"page":"1-3","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Modeling and Characterizing Shared and Local Memories of the Ampere GPUs"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4542-6673","authenticated-orcid":false,"given":"Hamdy","family":"Abdelkhalik","sequence":"first","affiliation":[{"name":"New Mexico State University, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5186-3012","authenticated-orcid":false,"given":"Yehia","family":"Arafa","sequence":"additional","affiliation":[{"name":"New Mexico State University, USA and Qualcomm, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4755-7821","authenticated-orcid":false,"given":"Nandakishore","family":"Santhi","sequence":"additional","affiliation":[{"name":"Los Alamos National Laboratory, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7558-0340","authenticated-orcid":false,"given":"Nirmal","family":"Prajapati","sequence":"additional","affiliation":[{"name":"Los Alamos National Laboratory, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8027-1449","authenticated-orcid":false,"given":"Abdel-Hameed A.","family":"Badawy","sequence":"additional","affiliation":[{"name":"New Mexico State University, USA and Los Alamos National Laboratory, USA"}]}],"member":"320","published-online":{"date-parts":[[2024,4,8]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"DeepBench. https:\/\/svail.github.io\/DeepBench\/."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC55821.2022.9926299"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/3392717.3392761"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/3458817.3476221"},{"key":"e_1_3_2_1_5_1","unstructured":"Yehia Arafa Abdel-Hameed\u00a0A. Badawy Gopinath Chennupati Nandakishore Santhi and Stephan Eidenbenz. PPT-GPU Tool. https:\/\/github.com\/lanl\/PPT"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/LCA.2019.2904497"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISPASS.2009.4919648"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/MASCOTS.2010.43"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/1735688.1735696"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00047"},{"key":"e_1_3_2_1_11_1","volume-title":"Automation & Test in Europe Conference & Exhibition (DATE). 1273\u20131278","author":"Li Ang","year":"2016","unstructured":"Ang Li, Shuaiwen\u00a0Leon Song, Akash Kumar, Eddy\u00a0Z. Zhang, Daniel Chavarr\u00eda-Miranda, and Henk Corporaal. 2016. Critical points based register-concurrency autotuning for GPUs. In 2016 Design, Automation & Test in Europe Conference & Exhibition (DATE). 1273\u20131278."},{"key":"e_1_3_2_1_12_1","unstructured":"NVIDIA. CUDA Binary Utilities. https:\/\/docs.nvidia.com\/cuda\/cuda-binary-utilities\/"},{"key":"e_1_3_2_1_13_1","unstructured":"NVIDIA. NVIDIA A100 whitepaper. https:\/\/images.nvidia.com\/aem-dam\/en-zz\/Solutions\/data-center\/nvidia-ampere-architecture-whitepaper.pdf"},{"key":"e_1_3_2_1_14_1","unstructured":"NVIDIA. NVIDIA Ampere Architecture In-Depth | NVIDIA Developer Blog. https:\/\/developer.nvidia.com\/blog\/nvidia-ampere-architecture-in-depth\/"},{"key":"e_1_3_2_1_15_1","unstructured":"NVIDIA. NVIDIA Nsight Systems. https:\/\/developer.nvidia.com\/nsight-systems"},{"key":"e_1_3_2_1_16_1","volume-title":"arXiv preprint arXiv:1907.02894","author":"Sakdhnagool Putt","year":"2019","unstructured":"Putt Sakdhnagool, Amit Sabne, and Rudolf Eigenmann. 2019. arXiv preprint arXiv:1907.02894 (2019)."},{"key":"e_1_3_2_1_17_1","unstructured":"Vijay Thakkar Pradeep Ramani Cris Cecka Aniket Shivam Honghao Lu Ethan Yan Jack Kosaian Mark Hoemmen Haicheng Wu Andrew Kerr Matt Nicely Duane Merrill Dustyn Blasig Fengqi Qiao Piotr Majcher Paul Springer Markus Hohnerbach Jin Wang and Manish Gupta. 2023. CUTLASS. https:\/\/github.com\/NVIDIA\/cutlass."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/2370816.2370865"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/3352460.3358307"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/2830772.2830813"}],"event":{"name":"MEMSYS '23: The International Symposium on Memory Systems","acronym":"MEMSYS '23","location":"Alexandria VA USA"},"container-title":["Proceedings of the International Symposium on Memory Systems"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3631882.3631891","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3631882.3631891","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T01:35:54Z","timestamp":1755912954000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3631882.3631891"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,2]]},"references-count":20,"alternative-id":["10.1145\/3631882.3631891","10.1145\/3631882"],"URL":"https:\/\/doi.org\/10.1145\/3631882.3631891","relation":{},"subject":[],"published":{"date-parts":[[2023,10,2]]},"assertion":[{"value":"2024-04-08","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}