{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,5]],"date-time":"2026-03-05T15:33:13Z","timestamp":1772724793929,"version":"3.50.1"},"reference-count":28,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2014,2]]},"DOI":"10.1109\/hpca.2014.6835930","type":"proceedings-article","created":{"date-parts":[[2014,7,28]],"date-time":"2014-07-28T14:48:01Z","timestamp":1406558881000},"page":"189-200","source":"Crossref","is-referenced-by-count":45,"title":["QuickRelease: A throughput-oriented approach to release consistency on GPUs"],"prefix":"10.1109","author":[{"given":"Blake A.","family":"Hechtman","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shuai","family":"Che","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Derek R.","family":"Hower","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yingying","family":"Tian","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bradford M.","family":"Beckmann","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mark D.","family":"Hill","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Steven K.","family":"Reinhardt","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"David A.","family":"Wood","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"19","first-page":"159","article-title":"Scalable store-load for-warding via store queue index prediction","author":"sha","year":"2005","journal-title":"Micro"},{"key":"17","doi-asserted-by":"publisher","DOI":"10.1109\/2.121510"},{"key":"18","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2010.31"},{"key":"15","year":"0","journal-title":"Standards"},{"key":"16","doi-asserted-by":"publisher","DOI":"10.2200\/S00346ED1V01Y201104CAC016"},{"key":"13","year":"2002","journal-title":"A Formal Specification of Intel\ufffd Itanium\ufffd Processor Family Memory Ordering"},{"key":"14","first-page":"180","article-title":"From causal consistency to sequential consistency in shared memory systems","author":"raynal","year":"1995","journal-title":"FST&TCS"},{"key":"11","doi-asserted-by":"publisher","DOI":"10.1109\/MC.2005.239"},{"key":"12","year":"1999","journal-title":"Alpha 21264 Microprocessor Hardware Reference Manual"},{"key":"21","doi-asserted-by":"publisher","DOI":"10.1109\/PACT.2005.11"},{"key":"20","article-title":"Mechanisms for store-wait-free multiprocessors","author":"thomas","year":"2007","journal-title":"ISCA"},{"key":"22","doi-asserted-by":"publisher","DOI":"10.1145\/2541940.2541981"},{"key":"23","doi-asserted-by":"publisher","DOI":"10.1145\/2024716.2024718"},{"key":"24","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2012.2"},{"key":"25","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2007.43"},{"key":"26","year":"2013","journal-title":"Accelerated Parallel Processing (APP) SDK"},{"key":"27","doi-asserted-by":"publisher","DOI":"10.1145\/2188286.2188341"},{"key":"28","doi-asserted-by":"publisher","DOI":"10.1145\/2485922.2485964"},{"key":"3","doi-asserted-by":"publisher","DOI":"10.1109\/IISWC.2009.5306797"},{"key":"2","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA.2013.6522351"},{"key":"10","doi-asserted-by":"publisher","DOI":"10.1109\/2.546611"},{"key":"1","year":"0","journal-title":"An Introduction to the HAS Intermediate Lan-guage"},{"key":"7","year":"2012","journal-title":"NVIDIA NVIDIA's Next Generation CUDA Computer Architecture Kepler GK110"},{"key":"6","doi-asserted-by":"publisher","DOI":"10.1145\/1375527.1375528"},{"key":"5","author":"munshi","year":"2008","journal-title":"OpenCL \" Parallel Computing on the GPU and CPU SIGGRAPH"},{"key":"4","doi-asserted-by":"publisher","DOI":"10.1145\/2485922.2485940"},{"key":"9","article-title":"AFDS 2011 phil rogers keynote","author":"foundation","year":"0","journal-title":"The Pro-grammer's Guide to the APU"},{"key":"8","year":"2012","journal-title":"Southern Islands Series Instruction Set Architecture"}],"event":{"name":"2014 IEEE 20th International Symposium on High Performance Computer Architecture (HPCA)","location":"Orlando, FL, USA","start":{"date-parts":[[2014,2,15]]},"end":{"date-parts":[[2014,2,19]]}},"container-title":["2014 IEEE 20th International Symposium on High Performance Computer Architecture (HPCA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6823235\/6835920\/06835930.pdf?arnumber=6835930","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,3,23]],"date-time":"2017-03-23T18:21:57Z","timestamp":1490293317000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/6835930\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,2]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/hpca.2014.6835930","relation":{},"subject":[],"published":{"date-parts":[[2014,2]]}}}