{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,28]],"date-time":"2025-09-28T15:35:41Z","timestamp":1759073741780,"version":"3.44.0"},"publisher-location":"Cham","reference-count":24,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031998539"},{"type":"electronic","value":"9783031998546"}],"license":[{"start":{"date-parts":[[2025,8,27]],"date-time":"2025-08-27T00:00:00Z","timestamp":1756252800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,8,27]],"date-time":"2025-08-27T00:00:00Z","timestamp":1756252800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-031-99854-6_4","type":"book-chapter","created":{"date-parts":[[2025,8,26]],"date-time":"2025-08-26T05:09:55Z","timestamp":1756184995000},"page":"54-70","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["THAPI: Tracing Heterogeneous APIs"],"prefix":"10.1007","author":[{"given":"Solomon","family":"Bekele","sequence":"first","affiliation":[]},{"given":"Aurelio","family":"Vivas","sequence":"additional","affiliation":[]},{"given":"Thomas","family":"Applencourt","sequence":"additional","affiliation":[]},{"given":"Servesh","family":"Muralidharan","sequence":"additional","affiliation":[]},{"given":"Bryce","family":"Allen","sequence":"additional","affiliation":[]},{"given":"Kazutomo","family":"Yoshii","sequence":"additional","affiliation":[]},{"given":"Swann","family":"Perarnau","sequence":"additional","affiliation":[]},{"given":"Brice","family":"Videau","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,8,27]]},"reference":[{"key":"4_CR1","unstructured":"AMD OmniTrace. https:\/\/rocm.docs.amd.com\/projects\/omnitrace\/en\/latest\/doxygen\/html\/index.html. Accessed Mar 2025"},{"key":"4_CR2","unstructured":"Babeltrace2. https:\/\/babeltrace.org\/docs\/v2.0\/man1\/babeltrace2.1\/. Accessed 20 Jul 2024"},{"key":"4_CR3","unstructured":"Intel VTune Profiler. https:\/\/www.intel.com\/content\/www\/us\/en\/docs\/vtune-profiler\/installation-guide\/2025-0\/overview.html"},{"key":"4_CR4","unstructured":"AMD: ROC Profiler. https:\/\/rocm.docs.amd.com\/projects\/rocprofiler\/en\/docs-5.5.1\/rocprof.html. Accessed 20 Jul 2024"},{"key":"4_CR5","unstructured":"AMD: Hip programming guide (2025). https:\/\/rocm.docs.amd.com\/projects\/HIP\/en\/latest\/understand\/programming_model.html. Accessed 20 Feb 2025"},{"key":"4_CR6","doi-asserted-by":"publisher","unstructured":"Babej, M., et\u00a0al.: HIPCL: Tool for porting cuda applications to advanced openCL platforms through HIP. In: IWOCL 2020. ACM, New York, NY, USA (2020). https:\/\/doi.org\/10.1145\/3388333.3388641","DOI":"10.1145\/3388333.3388641"},{"key":"4_CR7","doi-asserted-by":"publisher","unstructured":"Boehme, D., et\u00a0al.: Caliper: Performance introspection for HPC software stacks. In: SC\u201916, pp. 550\u2013560 (2016). https:\/\/doi.org\/10.1109\/SC.2016.46","DOI":"10.1109\/SC.2016.46"},{"issue":"1","key":"4_CR8","doi-asserted-by":"publisher","DOI":"10.1155\/2015\/940628","volume":"2015","author":"D Couturier","year":"2015","unstructured":"Couturier, D., Dagenais, M.R.: Lttng CLUST: A system-wide unified CPU and GPU tracing tool for openCL applications. Adv. Softw. Eng. 2015(1), 940628 (2015). https:\/\/doi.org\/10.1155\/2015\/940628","journal-title":"Adv. Softw. Eng."},{"key":"4_CR9","unstructured":"Desnoyers, M., Dagenais, M.R.: The LTTng Tracer: A low impact performance and behavior monitor for GNU\/Linux. In: Proceedings of the Ottawa Linux Symposium (2006). https:\/\/api.semanticscholar.org\/CorpusID:11300732"},{"key":"4_CR10","unstructured":"Fournier, P.M., de\u00a0Montr\u00e9al, \u00c9.P., Desnoyers, M., Dagenais, M.R.: Combined tracing of the kernel and applications with LTTng (2010). https:\/\/api.semanticscholar.org\/CorpusID:215820229"},{"key":"4_CR11","unstructured":"Google: Perfetto: Performance instrumentation and tracing. https:\/\/perfetto.dev (2024)"},{"key":"4_CR12","unstructured":"Intel: Profiling tools interfaces for GPU. https:\/\/github.com\/intel\/pti-gpu. Accessed Mar 2025"},{"key":"4_CR13","doi-asserted-by":"publisher","unstructured":"Jin, Z., Vetter, J.S.: A benchmark suite for improving performance portability of the sycl programming model. In: ISPASS 2023, pp. 325\u2013327 (2023). https:\/\/doi.org\/10.1109\/ISPASS57527.2023.00041","DOI":"10.1109\/ISPASS57527.2023.00041"},{"key":"4_CR14","doi-asserted-by":"crossref","unstructured":"Kn\u00fcpfer, A., R\u00f6ssel, et\u00a0al, C.: Score-p: A joint performance measurement run-time infrastructure for periscope,scalasca, tau, and vampir. In: Tools for High Performance Computing 2011, pp. 79\u201391. Springer Berlin Heidelberg, Berlin, Heidelberg (2012)","DOI":"10.1007\/978-3-642-31476-6_7"},{"key":"4_CR15","doi-asserted-by":"publisher","unstructured":"Li, e.a.: Spechpc 2021 benchmark suites for modern HPC systems, pp. 15\u201316. ICPE \u201922, ACM, New York, NY, USA (2022). https:\/\/doi.org\/10.1145\/3491204.3527498","DOI":"10.1145\/3491204.3527498"},{"issue":"17","key":"4_CR16","doi-asserted-by":"publisher","DOI":"10.1002\/cpe.5231","volume":"31","author":"P Margheritta","year":"2019","unstructured":"Margheritta, P., Dagenais, M.R.: LTTng-HSA: Bringing LTTng tracing to HSA-based GPU runtimes. Concurrency Comput. Prac. Experience 31(17), e5231 (2019). https:\/\/doi.org\/10.1002\/cpe.5231","journal-title":"Concurrency Comput. Prac. Experience"},{"key":"4_CR17","doi-asserted-by":"crossref","unstructured":"Nickolls, J., Buck, I., Garland, M., Skadron, K.: Scalable parallel programming with cuda. ACM Queue 6(2), 40\u201353 (2008). http:\/\/dblp.uni-trier.de\/db\/journals\/queue\/queue6.html","DOI":"10.1145\/1365490.1365500"},{"key":"4_CR18","unstructured":"NVIDIA: Nsight Compute. https:\/\/developer.nvidia.com\/nsight-compute. Accessed 20 Jul 2024"},{"key":"4_CR19","doi-asserted-by":"publisher","unstructured":"Reyes, R.e.a.: Sycl 2020: More than meets the eye. In: Proceedings of the International Workshop on OpenCL. IWOCL \u201920, ACM, New York, NY, USA (2020). https:\/\/doi.org\/10.1145\/3388333.3388649","DOI":"10.1145\/3388333.3388649"},{"issue":"2","key":"4_CR20","doi-asserted-by":"publisher","first-page":"287","DOI":"10.1177\/1094342006064482","volume":"20","author":"SS Shende","year":"2006","unstructured":"Shende, S.S., Malony, A.D.: The tau parallel performance system. Int. J. High Perform. Comput. Appl. 20(2), 287\u2013311 (2006). https:\/\/doi.org\/10.1177\/1094342006064482","journal-title":"Int. J. High Perform. Comput. Appl."},{"key":"4_CR21","doi-asserted-by":"publisher","unstructured":"Tallent, N., Mellor-Crummey, J., Adhianto, L., Fagan, M., Krentel, M.: HPCToolkit: performance tools for scientific computing. J. Phys. Conf. Ser. 125(1), 012088 (2008). https:\/\/doi.org\/10.1088\/1742-6596\/125\/1\/012088","DOI":"10.1088\/1742-6596\/125\/1\/012088"},{"key":"4_CR22","unstructured":"The TOP500 project : Top500 lists. https:\/\/top500.org\/lists\/top500\/2024\/06\/"},{"issue":"4","key":"4_CR23","doi-asserted-by":"publisher","first-page":"805","DOI":"10.1109\/TPDS.2021.3097283","volume":"33","author":"CR Trott","year":"2022","unstructured":"Trott, C.R., Lebrun-Grandi\u00e9, D., et al.: Kokkos 3: Programming model extensions for the exascale era. IEEE Trans. Parallel Distrib. Syst. 33(4), 805\u2013817 (2022). https:\/\/doi.org\/10.1109\/TPDS.2021.3097283","journal-title":"IEEE Trans. Parallel Distrib. Syst."},{"issue":"25","key":"4_CR24","doi-asserted-by":"publisher","DOI":"10.1002\/cpe.7866","volume":"35","author":"J Zhao","year":"2023","unstructured":"Zhao, J., Bertoni, C., Young, J., Harms, K., Sarkar, V., Videau, B.: HIPLZ: Enabling performance portability for exascale systems. Concurrency Comput. Prac. Experience 35(25), e7866 (2023). https:\/\/doi.org\/10.1002\/cpe.7866","journal-title":"Concurrency Comput. Prac. Experience"}],"container-title":["Lecture Notes in Computer Science","Euro-Par 2025: Parallel Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-99854-6_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,3]],"date-time":"2025-09-03T09:43:48Z","timestamp":1756892628000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-99854-6_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,27]]},"ISBN":["9783031998539","9783031998546"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-99854-6_4","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025,8,27]]},"assertion":[{"value":"27 August 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"Euro-Par","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Parallel Processing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Dresden","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Germany","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"25 August 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 August 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"31","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"europar2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/2025.euro-par.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}