{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,23]],"date-time":"2025-08-23T00:10:06Z","timestamp":1755907806069,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":29,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,5,5]],"date-time":"2025-05-05T00:00:00Z","timestamp":1746403200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc\/4.0\/"}],"funder":[{"name":"Federal Ministry of Education and Research (Germany)","award":["16ME0602"],"award-info":[{"award-number":["16ME0602"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,5,5]]},"DOI":"10.1145\/3680256.3721323","type":"proceedings-article","created":{"date-parts":[[2025,5,3]],"date-time":"2025-05-03T01:00:58Z","timestamp":1746234058000},"page":"215-222","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Performance Tools for the NEC SX-Aurora Tsubasa"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4741-7201","authenticated-orcid":false,"given":"Christian","family":"von Elm","sequence":"first","affiliation":[{"name":"CIDS, Information Services and High Performance Computing (ZIH), TU Dresden, Dresden, Germany"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-0666-4166","authenticated-orcid":false,"given":"Robert","family":"Sch\u00f6ne","sequence":"additional","affiliation":[{"name":"CIDS, Information Services and High Performance Computing (ZIH), TU Dresden, Dresden, Germany"}]}],"member":"320","published-online":{"date-parts":[[2025,5,5]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"TOP 500. 2024. TOP 500 November 2024. https:\/\/top500.org\/lists\/top500\/2024\/11\/."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","unstructured":"P. Adamidis E. Pfister H. Bockelmann D. 
Zobel J.-O. Beismann and M. Jacob. 2024. The Real Challenges for Climate and Weather Modelling on its Way to Sustained Exascale Performance: A Case Study using ICON (v2.6.6). Geoscientific Model Development Discussions (2024). doi:10.5194\/gmd-2024-54","DOI":"10.5194\/gmd-2024-54"},{"volume-title":"Fortran 90 Standard (ISO\/IEC 1539 : 1991 (E))","author":"American National Standards Institute 1991.","key":"e_1_3_2_1_3_1","unstructured":"American National Standards Institute 1991. Fortran 90 Standard (ISO\/IEC 1539 : 1991 (E)). American National Standards Institute. https:\/\/wg5-fortran.org\/N001-N1100\/N692.pdf"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-11261-4_2"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.14529\/jsfi210204"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","unstructured":"Ryusuke Egawa Souya Fujimoto Tsuyoshi Yamashita Daisuke Sasaki Yoko Isobe Yoichi Shimomura and Hiroyuki Takizawa. 2020. Exploiting the Potentials of the Second Generation SX-Aurora TSUBASA. In 2020 IEEE\/ACM Performance Modeling Benchmarking and Simulation of High Performance Computer Systems (PMBS). 39--49. doi:10.1109\/PMBS51919.2020.00010","DOI":"10.1109\/PMBS51919.2020.00010"},{"key":"e_1_3_2_1_7_1","unstructured":"Erich Focht. 2018. Testing VEOS with accelerated DMA and VE profiling. (2018). https:\/\/sx-aurora.github.io\/posts\/Testing-VEOS-DMA-prof\/"},{"key":"e_1_3_2_1_8_1","unstructured":"Erich Focht. 2018. VE monitoring with veperf. (2018). https:\/\/sx-aurora.github.io\/posts\/VE-monitoring-veperf\/"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","unstructured":"Constantino G\u00f3mez Marc Casas Filippo Mantovani and Erich Focht. 2020. Optimizing Sparse Matrix-Vector Multiplication in NEC SX-Aurora Vector Engine. doi:10.13140\/RG.2.2.24346.47042","DOI":"10.13140\/RG.2.2.24346.47042"},{"key":"e_1_3_2_1_10_1","unstructured":"Thomas Ilsche. 2020. 
Energy Measurements of High Performance Computing Systems: From Instrumentation to Analysis. Ph.D. Dissertation. TU Dresden. https:\/\/nbn-resolving.org\/urn:nbn:de:bsz:14-qucosa2-716000."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/CLUSTER.2017.116"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-13-6624-6_9"},{"key":"e_1_3_2_1_13_1","volume-title":"Intel\u00ae VTune\u2122 Profiler User Guide","author":"Intel Corporation 2023.","year":"2023","unstructured":"Intel Corporation 2023. Intel\u00ae VTune\u2122 Profiler User Guide. Intel Corporation. https:\/\/cdrdv2.intel.com\/v1\/dl\/getContent\/773628?fileName=vtuneprofiler_user-guide_2023.1-766319-773628.pdf"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/3432261.3432265"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","unstructured":"Andreas Kn\u00fcpfer Christian R\u00f6ssel Dieter an Mey Scott Biersdorff Kai Diethelm Dominic Eschweiler Markus Geimer Michael Gerndt Daniel Lorenz Allen Malony Wolfgang E. Nagel Yury Oleynik Peter Philippen Pavel Saviankou Dirk Schmidl Sameer Shende Ronny Tsch\u00fcter Michael Wagner Bert Wesarg and Felix Wolf. 2012. Score-P: A Joint Performance Measurement Run-Time Infrastructure for Periscope Scalasca TAU and Vampir. In Tools for High Performance Computing 2011. 79--91. doi:10.1007\/978-3-642-31476-6_7","DOI":"10.1007\/978-3-642-31476-6_7"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/SC.2018.00057"},{"key":"e_1_3_2_1_17_1","unstructured":"Message Passing Interface Forum 2023. MPI: A Message-Passing Interface Standard Version 4.1. Message Passing Interface Forum. https:\/\/www.mpi-forum.org\/docs\/mpi-4.1\/mpi41-report.pdf"},{"key":"e_1_3_2_1_18_1","unstructured":"Simon Moll Matthias Kurtenacker Erich Focht and Sebastian Hack. 2018. NEC SX-Aurora TSUBASA and the LLVM compiler infrastructure. (2018). 
https:\/\/fs.hlrs.de\/projects\/teraflop\/28thWorkshop_talks\/WSSP28_SMoll_llvm-sve.pdf"},{"volume-title":"SX-Aurora TSUBASA Architecture Guide Revision 1.1","author":"NEC Corporation 2018.","key":"e_1_3_2_1_19_1","unstructured":"NEC Corporation 2018. SX-Aurora TSUBASA Architecture Guide Revision 1.1. NEC Corporation."},{"key":"e_1_3_2_1_20_1","unstructured":"NEC Corporation 2023. PROGINF\/FTRACE User's Guide (G2AT03E). NEC Corporation. https:\/\/sxauroratsubasa.sakura.ne.jp\/documents\/sdk\/pdfs\/g2at03e-PROGINF_FTRACE_User_Guide_en.pdf"},{"volume-title":"NVIDIA Nsight Systems user guide","author":"NVIDIA Corporation","key":"e_1_3_2_1_21_1","unstructured":"NVIDIA Corporation & Affiliates 2024. NVIDIA Nsight Systems user guide. NVIDIA Corporation & Affiliates. https:\/\/docs.nvidia.com\/nsight-systems\/UserGuide\/index.html"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-71058-3_8"},{"key":"e_1_3_2_1_23_1","unstructured":"Opari 2 developers 2023. Opari 2 User Manual. Opari 2 developers. https:\/\/perftools.pages.jsc.fz-juelich.de\/cicd\/opari2\/tags\/opari2-2.0.8\/pdf\/opari2.pdf"},{"key":"e_1_3_2_1_24_1","unstructured":"OpenMP Architecture Review Board 2024. OpenMP Application Programming Interface Version 6.0. OpenMP Architecture Review Board. 
https:\/\/www.openmp.org\/wp-content\/uploads\/OpenMP-API-Specification-6-0.pdf"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-56702-0_4"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1177\/1094342006064482"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-32041-5_19"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/1498765.1498785"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1002\/qj.2378"}],"event":{"name":"ICPE '25: 16th ACM\/SPEC International Conference on Performance Engineering","sponsor":["SIGMETRICS ACM Special Interest Group on Measurement and Evaluation","SIGSOFT ACM Special Interest Group on Software Engineering"],"location":"Toronto ON Canada","acronym":"ICPE '25"},"container-title":["Companion of the 16th ACM\/SPEC International Conference on Performance Engineering"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3680256.3721323","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3680256.3721323","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T23:48:58Z","timestamp":1755906538000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3680256.3721323"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,5]]},"references-count":29,"alternative-id":["10.1145\/3680256.3721323","10.1145\/3680256"],"URL":"https:\/\/doi.org\/10.1145\/3680256.3721323","relation":{},"subject":[],"published":{"date-parts":[[2025,5,5]]},"assertion":[{"value":"2025-05-05","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}