{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,11]],"date-time":"2026-04-11T02:10:07Z","timestamp":1775873407421,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":49,"publisher":"ACM","license":[{"start":{"date-parts":[[2022,6,11]],"date-time":"2022-06-11T00:00:00Z","timestamp":1654905600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2022,6,18]]},"DOI":"10.1145\/3470496.3533045","type":"proceedings-article","created":{"date-parts":[[2022,5,31]],"date-time":"2022-05-31T19:06:01Z","timestamp":1654023961000},"page":"1058-1070","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":5,"title":["Mixed-proxy extensions for the NVIDIA PTX memory consistency model"],"prefix":"10.1145","author":[{"given":"Daniel","family":"Lustig","sequence":"first","affiliation":[{"name":"NVIDIA"}]},{"given":"Simon","family":"Cooksey","sequence":"additional","affiliation":[{"name":"University of Kent, Canterbury, UK"}]},{"given":"Olivier","family":"Giroux","sequence":"additional","affiliation":[{"name":"NVIDIA"}]}],"member":"320","published-online":{"date-parts":[[2022,6,11]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-28756-5_15"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/2694344.2694391"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/1481839.1481842"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/2994593"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/2594291.2594347"},{"key":"e_1_3_2_1_6_1","unstructured":"ARM. 2021. Arm Architecture Reference Manual Armv8 for A-Profile Architecture. https:\/\/developer.arm.com\/documentation\/ddi0487\/gb  ARM. 2021. Arm Architecture Reference Manual Armv8 for A-Profile Architecture. https:\/\/developer.arm.com\/documentation\/ddi0487\/gb"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-662-46669-8_12"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1145\/1926385.1926394"},{"key":"e_1_3_2_1_9_1","unstructured":"Hans-J. Boehm. 2013. Prohibiting \"Out of Thin Air\" Results in C++14. http:\/\/www.open-std.org\/jtc1\/sc22\/wg21\/docs\/papers\/2013\/n3786.htm.  Hans-J. Boehm. 2013. Prohibiting \"Out of Thin Air\" Results in C++14. http:\/\/www.open-std.org\/jtc1\/sc22\/wg21\/docs\/papers\/2013\/n3786.htm."},{"key":"e_1_3_2_1_10_1","volume-title":"Proceedings of the Twenty-Ninth International Conference on Programming Language Design and Implementation (PLDI).","author":"J.","unstructured":"Hans- J. Boehm and Sarita V. Adve. 2008. Foundations of the C++ Concurrency Memory Model . In Proceedings of the Twenty-Ninth International Conference on Programming Language Design and Implementation (PLDI). Hans-J. Boehm and Sarita V. Adve. 2008. Foundations of the C++ Concurrency Memory Model. In Proceedings of the Twenty-Ninth International Conference on Programming Language Design and Implementation (PLDI)."},{"key":"e_1_3_2_1_11_1","unstructured":"Hans-J. Boehm Mark Batty Olivier Giroux Paul McKenney Peter Sewell and Francesco Zappa Nardelli. 2013. Specifying the Absence of \"Out of Thin Air\" Results. http:\/\/www.open-std.org\/jtc1\/sc22\/wg21\/docs\/papers\/2013\/n3710.html.  Hans-J. Boehm Mark Batty Olivier Giroux Paul McKenney Peter Sewell and Francesco Zappa Nardelli. 2013. Specifying the Absence of \"Out of Thin Air\" Results. http:\/\/www.open-std.org\/jtc1\/sc22\/wg21\/docs\/papers\/2013\/n3710.html."},{"key":"e_1_3_2_1_12_1","volume-title":"Proceedings of the Workshop on Memory Systems Performance and Correctness (MSPC).","author":"J.","unstructured":"Hans- J. Boehm and Brian Demsky. 2014. Outlawing Ghosts: Avoiding Out-ofthin-air Results . In Proceedings of the Workshop on Memory Systems Performance and Correctness (MSPC). Hans-J. Boehm and Brian Demsky. 2014. Outlawing Ghosts: Avoiding Out-ofthin-air Results. In Proceedings of the Workshop on Memory Systems Performance and Correctness (MSPC)."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/3062341.3062353"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/782814.782854"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/3009837.3009839"},{"key":"e_1_3_2_1_16_1","unstructured":"HSA Foundation. 2015. HSA Platform System Architecture Specification. http:\/\/www.hsafoundation.com\/html\/Content\/PRM\/Topics\/06_Memory\/memory_model.htm.  HSA Foundation. 2015. HSA Platform System Architecture Specification. http:\/\/www.hsafoundation.com\/html\/Content\/PRM\/Topics\/06_Memory\/memory_model.htm."},{"key":"e_1_3_2_1_17_1","unstructured":"RISC-V Foundation. 2022. The RISC-V Instruction Set Manual Volume I: Unprivileged ISA. https:\/\/riscv.org.  RISC-V Foundation. 2022. The RISC-V Instruction Set Manual Volume I: Unprivileged ISA. https:\/\/riscv.org."},{"key":"e_1_3_2_1_18_1","unstructured":"Matt Godbolt. 2022. Compiler Explorer. https:\/\/godbolt.org\/  Matt Godbolt. 2022. Compiler Explorer. https:\/\/godbolt.org\/"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/2541940.2541981"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1145\/505145.505149"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/2933575.2934536"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1145\/3498716"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/3009837.3009850"},{"key":"e_1_3_2_1_24_1","unstructured":"Khronos Vulkan Working Group. 2018. Vulkan 1.1.92 - A Specification. https:\/\/www.khronos.org\/registry\/vulkan\/specs\/1.1-extensions\/html\/vkspec.html.  Khronos Vulkan Working Group. 2018. Vulkan 1.1.92 - A Specification. https:\/\/www.khronos.org\/registry\/vulkan\/specs\/1.1-extensions\/html\/vkspec.html."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1145\/2261417.2261438"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3062341.3062352"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/3297858.3304043"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/3037697.3037723"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-31424-7_36"},{"key":"e_1_3_2_1_30_1","volume-title":"ArXiv","author":"Manerkar Yatin A.","unstructured":"Yatin A. Manerkar , Caroline Trippel , Daniel Lustig , Michael Pellauer , and Margaret Martonosi . 2016. Counterexamples and Proof Loophole for the C\/C++ to POWER and ARMv7 Trailing-Sync Compiler Mappings . In ArXiv , Vol. abs\/ 1611 .01507. Yatin A. Manerkar, Caroline Trippel, Daniel Lustig, Michael Pellauer, and Margaret Martonosi. 2016. Counterexamples and Proof Loophole for the C\/C++ to POWER and ARMv7 Trailing-Sync Compiler Mappings. In ArXiv, Vol. abs\/1611.01507."},{"key":"e_1_3_2_1_31_1","volume-title":"Proceedings of the 32nd ACM SIGPLAN-SIGACT Symposium on Principles of Programming Languages (POPL).","author":"Manson Jeremy","unstructured":"Jeremy Manson , William Pugh , and Sarita V. Adve . 2005. The Java Memory Model . In Proceedings of the 32nd ACM SIGPLAN-SIGACT Symposium on Principles of Programming Languages (POPL). Jeremy Manson, William Pugh, and Sarita V. Adve. 2005. The Java Memory Model. In Proceedings of the 32nd ACM SIGPLAN-SIGACT Symposium on Principles of Programming Languages (POPL)."},{"key":"e_1_3_2_1_32_1","unstructured":"Luc Maranget and Jade Alglave. 2015. Towards a Formalization of the HSA Memory Model in the cat Language. https:\/\/hal.inria.fr\/hal-01413251  Luc Maranget and Jade Alglave. 2015. Towards a Formalization of the HSA Memory Model in the cat Language. https:\/\/hal.inria.fr\/hal-01413251"},{"key":"e_1_3_2_1_33_1","unstructured":"Paul E. McKenny Alan Jeffrey Ali Sezgin and Tony Tye. 2016. P0422: Out-of-Thin-Air Execution is Vacuous. http:\/\/www.open-std.org\/jtc1\/sc22\/wg21\/docs\/papers\/2016\/p0422r0.html.  Paul E. McKenny Alan Jeffrey Ali Sezgin and Tony Tye. 2016. P0422: Out-of-Thin-Air Execution is Vacuous. http:\/\/www.open-std.org\/jtc1\/sc22\/wg21\/docs\/papers\/2016\/p0422r0.html."},{"key":"e_1_3_2_1_34_1","unstructured":"MLCommons. 2021. General MLPerf Submission Rules v0.3. https:\/\/docs.nvidia.com\/cuda\/parallel-thread-execution\/index.html  MLCommons. 2021. General MLPerf Submission Rules v0.3. https:\/\/docs.nvidia.com\/cuda\/parallel-thread-execution\/index.html"},{"key":"e_1_3_2_1_35_1","unstructured":"NVIDIA. 2017. NVIDIA Tesla V100 GPU Architecture. http:\/\/images.nvidia.com\/content\/volta-architecture\/pdf\/volta-architecture-whitepaper.pdf.  NVIDIA. 2017. NVIDIA Tesla V100 GPU Architecture. http:\/\/images.nvidia.com\/content\/volta-architecture\/pdf\/volta-architecture-whitepaper.pdf."},{"key":"e_1_3_2_1_36_1","unstructured":"NVIDIA. 2021. CUDA C++ Programming Guide. https:\/\/docs.nvidia.com\/cuda\/cuda-c-programming-guide\/index.html  NVIDIA. 2021. CUDA C++ Programming Guide. https:\/\/docs.nvidia.com\/cuda\/cuda-c-programming-guide\/index.html"},{"key":"e_1_3_2_1_37_1","unstructured":"NVIDIA. 2021. PTX ISA :: CUDA Toolkit Documentation. https:\/\/docs.nvidia.com\/cuda\/parallel-thread-execution\/index.html  NVIDIA. 2021. PTX ISA :: CUDA Toolkit Documentation. https:\/\/docs.nvidia.com\/cuda\/parallel-thread-execution\/index.html"},{"key":"e_1_3_2_1_38_1","volume-title":"Proceedings of the Twentieth International Conference on Architectural Support for Programming Languages and Operating Systems (ASPLOS).","author":"Orr Marc S.","unstructured":"Marc S. Orr , Shuai Che , Ayse Yilmazer , Bradford M. Beckmann , Mark D. Hill , and David A. Wood . 2015. Synchronization Using Remote-Scope Promotion . In Proceedings of the Twentieth International Conference on Architectural Support for Programming Languages and Operating Systems (ASPLOS). Marc S. Orr, Shuai Che, Ayse Yilmazer, Bradford M. Beckmann, Mark D. Hill, and David A. Wood. 2015. Synchronization Using Remote-Scope Promotion. In Proceedings of the Twentieth International Conference on Architectural Support for Programming Languages and Operating Systems (ASPLOS)."},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-44914-8_22"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1145\/2837614.2837616"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1145\/3158107"},{"key":"e_1_3_2_1_42_1","volume-title":"Francesco Zappa Nardelli, and Magnus O. Myreen","author":"Sewell Peter","year":"2010","unstructured":"Peter Sewell , Susmit Sarkar , Scott Owens , Francesco Zappa Nardelli, and Magnus O. Myreen . 2010 . X86-TSO: A Rigorous and Usable Programmer's Model for x86 Multiprocessors. In Communications of the ACM, Vol. 53 . Issue 7. Peter Sewell, Susmit Sarkar, Scott Owens, Francesco Zappa Nardelli, and Magnus O. Myreen. 2010. X86-TSO: A Rigorous and Usable Programmer's Model for x86 Multiprocessors. In Communications of the ACM, Vol. 53. Issue 7."},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-99336-8_6"},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-44914-8_23"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/2830772.2830821"},{"key":"e_1_3_2_1_46_1","volume-title":"Proceedings of the Forty-Fourth Annual International Symposium on Computer Architecture (ISCA).","author":"Sinclair Matthew D.","unstructured":"Matthew D. Sinclair , Johnathan Alsop , and Sarita V. Adve . 2017. Chasing Away RAts: Semantics and Evaluation for Relaxed Atomics on Heterogeneous Systems . In Proceedings of the Forty-Fourth Annual International Symposium on Computer Architecture (ISCA). Matthew D. Sinclair, Johnathan Alsop, and Sarita V. Adve. 2017. Chasing Away RAts: Semantics and Evaluation for Relaxed Atomics on Heterogeneous Systems. In Proceedings of the Forty-Fourth Annual International Symposium on Computer Architecture (ISCA)."},{"key":"e_1_3_2_1_47_1","volume-title":"Proceedings of the Thirty-Seventh ACM SIGPLAN Conference on Programming Language Design and Implementation (PLDI).","author":"Sorensen Tyler","unstructured":"Tyler Sorensen and Alastair F. Donaldson . 2016. Exposing Errors Related to Weak Memory in GPU Applications . In Proceedings of the Thirty-Seventh ACM SIGPLAN Conference on Programming Language Design and Implementation (PLDI). Tyler Sorensen and Alastair F. Donaldson. 2016. Exposing Errors Related to Weak Memory in GPU Applications. In Proceedings of the Thirty-Seventh ACM SIGPLAN Conference on Programming Language Design and Implementation (PLDI)."},{"key":"e_1_3_2_1_48_1","volume-title":"Proceedings of the Forty-Fourth ACM SIGPLAN Symposium on Principles of Programming Languages (POPL).","author":"Wickerson John","unstructured":"John Wickerson , Mark Batty , Tyler Sorensen , and George A. Constantinides . 2017. Automatically Comparing Memory Consistency Models . In Proceedings of the Forty-Fourth ACM SIGPLAN Symposium on Principles of Programming Languages (POPL). John Wickerson, Mark Batty, Tyler Sorensen, and George A. Constantinides. 2017. Automatically Comparing Memory Consistency Models. In Proceedings of the Forty-Fourth ACM SIGPLAN Symposium on Principles of Programming Languages (POPL)."},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1145\/3009837.3009838"}],"event":{"name":"ISCA '22: The 49th Annual International Symposium on Computer Architecture","location":"New York New York","acronym":"ISCA '22","sponsor":["SIGARCH ACM Special Interest Group on Computer Architecture","IEEE CS TCAA IEEE CS technical committee on architectural acoustics"]},"container-title":["Proceedings of the 49th Annual International Symposium on Computer Architecture"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3470496.3533045","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3470496.3533045","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T20:18:54Z","timestamp":1750191534000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3470496.3533045"}},"subtitle":["industrial product"],"short-title":[],"issued":{"date-parts":[[2022,6,11]]},"references-count":49,"alternative-id":["10.1145\/3470496.3533045","10.1145\/3470496"],"URL":"https:\/\/doi.org\/10.1145\/3470496.3533045","relation":{},"subject":[],"published":{"date-parts":[[2022,6,11]]},"assertion":[{"value":"2022-06-11","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}