{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,30]],"date-time":"2025-12-30T08:59:40Z","timestamp":1767085180096,"version":"3.37.3"},"reference-count":40,"publisher":"Springer Science and Business Media LLC","issue":"6-8","license":[{"start":{"date-parts":[[2018,4,30]],"date-time":"2018-04-30T00:00:00Z","timestamp":1525046400000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2018,4,30]],"date-time":"2018-04-30T00:00:00Z","timestamp":1525046400000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation","doi-asserted-by":"publisher","award":["1409129"],"award-info":[{"award-number":["1409129"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Vis Comput"],"published-print":{"date-parts":[[2018,6]]},"DOI":"10.1007\/s00371-018-1532-8","type":"journal-article","created":{"date-parts":[[2018,4,30]],"date-time":"2018-04-30T05:44:51Z","timestamp":1525067091000},"page":"875-885","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":17,"title":["A detailed study of ray tracing performance: render time and energy 
cost"],"prefix":"10.1007","volume":"34","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-8039-2977","authenticated-orcid":false,"given":"Elena","family":"Vasiou","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Konstantin","family":"Shkurko","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ian","family":"Mallett","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Erik","family":"Brunvand","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Cem","family":"Yuksel","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2018,4,30]]},"reference":[{"key":"1532_CR1","unstructured":"Aila, T., Karras, T.: Architecture considerations for tracing incoherent rays. In: Proceedings of HPG (2010)"},{"key":"1532_CR2","doi-asserted-by":"crossref","unstructured":"Aila, T., Laine, S.: Understanding the efficiency of ray traversal on GPUs. In: Proceedings of HPG (2009)","DOI":"10.1145\/1572769.1572792"},{"key":"1532_CR3","doi-asserted-by":"crossref","unstructured":"Arnau, J.M., Parcerisa, J.M., Xekalakis, P.: Eliminating redundant fragment shader executions on a mobile GPU via hardware memoization. In: Proceedings of ISCA (2014)","DOI":"10.1109\/ISCA.2014.6853207"},{"key":"1532_CR4","doi-asserted-by":"crossref","unstructured":"Bakhoda, A., Yuan, G.L., Fung, W.W.L., Wong, H., Aamodt, T.M.: Analyzing CUDA workloads using a detailed GPU simulator. In: ISPASS (2009)","DOI":"10.1109\/ISPASS.2009.4919648"},{"issue":"4","key":"1532_CR5","doi-asserted-by":"publisher","first-page":"33","DOI":"10.1145\/2601097.2601222","volume":"33","author":"R Barringer","year":"2014","unstructured":"Barringer, R., Akenine-M\u00f6ller, T.: Dynamic ray stream traversal. 
ACM TOG 33(4), 33 (2014)","journal-title":"ACM TOG"},{"issue":"2","key":"1532_CR6","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/2024716.2024718","volume":"39","author":"N Binkert","year":"2011","unstructured":"Binkert, N., Beckmann, B., Black, G., Reinhardt, S.K., Saidi, A., Basu, A., Hestness, J., Hower, D.R., Krishna, T., Sardashti, S., et al.: The gem5 simulator. ACM SIGARCH Comp Arch News 39(2), 1\u20137 (2011)","journal-title":"ACM SIGARCH Comp Arch News"},{"key":"1532_CR7","doi-asserted-by":"crossref","unstructured":"Boulos, S., Edwards, D., Lacewell, J.D., Kniss, J., Kautz, J., Shirley, P., Wald, I.: Packet-based Whitted and distribution ray tracing. In: Proceedings of Graphics Interface (2007)","DOI":"10.1145\/1268517.1268547"},{"key":"1532_CR8","doi-asserted-by":"crossref","unstructured":"Brunvand, E., Kopta, D., Chatterjee, N.: Why graphics programmers need to know about DRAM. In: ACM SIGGRAPH 2014 Courses (2014)","DOI":"10.1145\/2614028.2615421"},{"key":"1532_CR9","doi-asserted-by":"crossref","unstructured":"Budge, B., Bernardin, T., Stuart, J.A., Sengupta, S., Joy, K.I., Owens, J.D.: Out-of-core Data Management for Path Tracing on Hybrid Resources. CGF (2009)","DOI":"10.1111\/j.1467-8659.2009.01378.x"},{"key":"1532_CR10","unstructured":"Chatterjee, N., Balasubramonian, R., Shevgoor, M., Pugsley, S., Udipi, A., Shafiee, A., Sudan, K., Awasthi, M., Chishti, Z.: USIMM: the Utah SImulated Memory Module. Technical Report UUCS-12-02, U. of Utah (2012)"},{"key":"1532_CR11","doi-asserted-by":"crossref","unstructured":"Chatterjee, N., OConnor, M., Lee, D., Johnson, D.R., Keckler, S.W., Rhu, M., Dally, W.J.: Architecting an energy-efficient DRAM system for GPUs. In: HPCA (2017)","DOI":"10.1109\/HPCA.2017.58"},{"key":"1532_CR12","doi-asserted-by":"crossref","unstructured":"Christensen, P.H., Laur, D.M., Fong, J., Wooten, W.L., Batali, D.: Ray differentials and multiresolution geometry caching for distribution ray tracing in complex scenes. 
In: Eurographics (2003)","DOI":"10.1111\/1467-8659.t01-1-00702"},{"key":"1532_CR13","unstructured":"Dally, B.: The challenge of future high-performance computing. Uppsala University, Uppsala, Sweden, Celsius Lecture (2013)"},{"key":"1532_CR14","doi-asserted-by":"crossref","unstructured":"Gribble, C., Ramani, K.: Coherent ray tracing via stream filtering. In: IRT (2008)","DOI":"10.1109\/RT.2008.4634622"},{"key":"1532_CR15","doi-asserted-by":"crossref","unstructured":"Hapala, M., Davidovic, T., Wald, I., Havran, V., Slusallek, P.: Efficient stack-less BVH traversal for ray tracing. In: SCCG (2011)","DOI":"10.1145\/2461217.2461219"},{"key":"1532_CR16","unstructured":"HWRT: SimTRaX a cycle-accurate ray tracing architectural simulator and compiler. http:\/\/code.google.com\/p\/simtrax\/ (2012). Utah Hardware Ray Tracing Group"},{"key":"1532_CR17","first-page":"60","volume":"3","author":"B Johnsson","year":"2014","unstructured":"Johnsson, B., Akenine-M\u00f6ller, T.: Measuring per-frame energy consumption of real-time graphics applications. JCGT 3, 60\u201373 (2014)","journal-title":"JCGT"},{"key":"1532_CR18","unstructured":"Johnsson, B., Ganestam, P., Doggett, M., Akenine-M\u00f6ller, T.: Power efficiency for software algorithms running on graphics processors. In: HPG (2012)"},{"key":"1532_CR19","doi-asserted-by":"crossref","unstructured":"Kajiya, J.T.: The rendering equation. In: Proceedings of SIGGRAPH (1986)","DOI":"10.1145\/15922.15902"},{"key":"1532_CR20","doi-asserted-by":"crossref","unstructured":"Karras, T., Aila, T.: Fast parallel construction of high-quality bounding volume hierarchies. In: Proceedings of HPG (2013)","DOI":"10.1145\/2492045.2492055"},{"key":"1532_CR21","doi-asserted-by":"crossref","unstructured":"Kopta, D., Shkurko, K., Spjut, J., Brunvand, E., Davis, A.: An energy and bandwidth efficient ray tracing architecture. 
In: Proceedings of HPG (2013)","DOI":"10.1145\/2492045.2492058"},{"issue":"1","key":"1532_CR22","first-page":"47","volume":"34","author":"D Kopta","year":"2015","unstructured":"Kopta, D., Shkurko, K., Spjut, J., Brunvand, E., Davis, A.: Memory considerations for low energy ray tracing. CGF 34(1), 47\u201359 (2015)","journal-title":"CGF"},{"key":"1532_CR23","doi-asserted-by":"crossref","unstructured":"Lee, W.J., Shin, Y., Hwang, S.J., Kang, S., Yoo, J.J., Ryu, S.: Reorder buffer: an energy-efficient multithreading architecture for hardware MIMD ray traversal. In: Proceedings of HPG (2015)","DOI":"10.1145\/2790060.2790064"},{"key":"1532_CR24","unstructured":"Liktor, G., Vaidyanathan, K.: Bandwidth-efficient BVH layout for incremental hardware traversal. In: Proceedings of HPG (2016)"},{"key":"1532_CR25","doi-asserted-by":"crossref","unstructured":"Mansson, E., Munkberg, J., Akenine-Moller, T.: Deep coherent ray tracing. In: IRT (2007)","DOI":"10.1109\/RT.2007.4342594"},{"key":"1532_CR26","doi-asserted-by":"crossref","unstructured":"Moon, B., Byun, Y., Kim, T.J., Claudio, P., Kim, H.S., Ban, Y.J., Nam, S.W., Yoon, S.E.: Cache-oblivious ray reordering. ACM Trans. Graph. 29(3), 28:1\u201328:10 (2010)","DOI":"10.1145\/1805964.1805972"},{"key":"1532_CR27","doi-asserted-by":"crossref","unstructured":"Muralimanohar, N., Balasubramonian, R., Jouppi, N.: Optimizing NUCA organizations and wiring alternatives for large caches with CACTI 6.0. In: MICRO (2007)","DOI":"10.1109\/MICRO.2007.33"},{"key":"1532_CR28","doi-asserted-by":"crossref","unstructured":"Navr\u00e1til, P., Fussell, D., Lin, C., Mark, W.: Dynamic ray scheduling to improve ray coherence and bandwidth utilization. In: IRT (2007)","DOI":"10.1109\/RT.2007.4342596"},{"key":"1532_CR29","unstructured":"Navr\u00e1til, P.A., Mark, W.R.: An analysis of ray tracing bandwidth consumption. 
University of Texas at Austin, Computer Science Department (2006)"},{"key":"1532_CR30","doi-asserted-by":"crossref","unstructured":"Overbeck, R., Ramamoorthi, R., Mark, W.R.: Large ray packets for real-time Whitted ray tracing. In: IRT (2008)","DOI":"10.1109\/RT.2008.4634619"},{"key":"1532_CR31","unstructured":"Pool, J.: Energy-precision tradeoffs in the graphics pipeline. Ph.D. thesis, UNC, Chapel Hill (2012)"},{"key":"1532_CR32","doi-asserted-by":"crossref","unstructured":"Pool, J., Lastra, A., Singh, M.: An energy model for graphics processing units. In: ICCD (2010)","DOI":"10.1109\/ICCD.2010.5647678"},{"key":"1532_CR33","doi-asserted-by":"crossref","unstructured":"Shkurko, K., Grant, T., Kopta, D., Mallett, I., Yuksel, C., Brunvand, E.: Dual streaming for hardware-accelerated ray tracing. In: Proceedings of HPG (2017)","DOI":"10.1145\/3105762.3105771"},{"key":"1532_CR34","doi-asserted-by":"crossref","unstructured":"Smits, B.: Efficiency issues for ray tracing. In: SIGGRAPH Courses, SIGGRAPH \u201905 (2005)","DOI":"10.1145\/1198555.1198745"},{"key":"1532_CR35","unstructured":"Spjut, J., Kensler, A., Kopta, D., Brunvand, E.: TRaX: A multicore hardware architecture for real-time ray tracing. IEEE Trans. CAD 28(12), 1802\u20131815 (2009)"},{"key":"1532_CR36","doi-asserted-by":"crossref","unstructured":"Spjut, J., Kopta, D., Boulos, S., Kellis, S., Brunvand, E.: TRaX: A multi-threaded architecture for real-time ray tracing. In: SASP (2008)","DOI":"10.1109\/SASP.2008.4570794"},{"key":"1532_CR37","doi-asserted-by":"crossref","unstructured":"Tsakok, J.A.: Faster incoherent rays: Multi-BVH ray stream tracing. In: Proceedings of HPG (2009)","DOI":"10.1145\/1572769.1572793"},{"key":"1532_CR38","doi-asserted-by":"crossref","unstructured":"Vogelsang, T.: Understanding the energy consumption of dynamic random access memories. 
In: MICRO \u201943 (2010)","DOI":"10.1109\/MICRO.2010.42"},{"key":"1532_CR39","doi-asserted-by":"crossref","unstructured":"Wang, R., Yu, B., Marco, J., Hu, T., Gutierrez, D., Bao, H.: Real-time rendering on a power budget. ACM TOG 35(4), 111:1\u2013111:11 (2016)","DOI":"10.1145\/2897824.2925889"},{"key":"1532_CR40","doi-asserted-by":"crossref","unstructured":"Whitted, T.: An improved illumination model for shaded display. Com. ACM 23(6), 343\u2013349 (1980)","DOI":"10.1145\/358876.358882"}],"container-title":["The Visual Computer"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s00371-018-1532-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-018-1532-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s00371-018-1532-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,9,2]],"date-time":"2023-09-02T10:04:59Z","timestamp":1693649099000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s00371-018-1532-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2018,4,30]]},"references-count":40,"journal-issue":{"issue":"6-8","published-print":{"date-parts":[[2018,6]]}},"alternative-id":["1532"],"URL":"https:\/\/doi.org\/10.1007\/s00371-018-1532-8","relation":{},"ISSN":["0178-2789","1432-2315"],"issn-type":[{"type":"print","value":"0178-2789"},{"type":"electronic","value":"1432-2315"}],"subject":[],"published":{"date-parts":[[2018,4,30]]},"assertion":[{"value":"30 April 2018","order":1,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Compliance 
with Ethical Standards"}},{"value":"The authors, Elena Vasiou, Konstantin Shkurko, Ian Mallett, Erik Brunvand, and Cem Yuksel, declare that they have no conflict of interest relating to this work and publication.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}