{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,27]],"date-time":"2026-03-27T17:08:53Z","timestamp":1774631333707,"version":"3.50.1"},"reference-count":53,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"6","license":[{"start":{"date-parts":[[2020,6,1]],"date-time":"2020-06-01T00:00:00Z","timestamp":1590969600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Parallel Distrib. Syst."],"published-print":{"date-parts":[[2020,6,1]]},"DOI":"10.1109\/tpds.2019.2960333","type":"journal-article","created":{"date-parts":[[2019,12,18]],"date-time":"2019-12-18T20:45:41Z","timestamp":1576701941000},"page":"1316-1327","source":"Crossref","is-referenced-by-count":27,"title":["SLEEF: A Portable Vectorized Library of C Standard Mathematical Functions"],"prefix":"10.1109","volume":"31","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9430-5555","authenticated-orcid":false,"given":"Naoki","family":"Shibata","sequence":"first","affiliation":[{"name":"Graduate School of Information Science, Nara Institute of Science and Technology, Nara, Japan"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8375-3638","authenticated-orcid":false,"given":"Francesco","family":"Petrogalli","sequence":"additional","affiliation":[{"name":"ARM 110, Cambridge, United Kingdom"}]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/ISPASS.2006.1620789"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2016.25"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/CGO.2004.1281665"},{"key":"ref32","year":"2004"},{"key":"ref31","article-title":"Arm compiler for HPC","year":"0"},{"key":"ref30","article-title":"GCC, the GNU compiler collection","year":"1984"},{"key":"ref37","article-title":"Vector function application binary interface","author":"tian","year":"2015"},{"key":"ref36","first-page":"62","article-title":"Extending OpenMP SIMD support for target specific code and application to ARM SVE","author":"lee","year":"2017","journal-title":"Proceedings of the International Workshop on OpenMP"},{"key":"ref35","article-title":"OpenMP application program interface","year":"2013"},{"key":"ref34","article-title":"Vector function application binary interface specification for AArch64","year":"2018"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/1133981.1133997"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/359327.359336"},{"key":"ref29","first-page":"36","article-title":"Intel OpenMP C++\/fortran compiler for hyper-threading technology: Implementation and performance","volume":"6","author":"tian","year":"2002","journal-title":"Intel Technol J"},{"key":"ref2","first-page":"105","article-title":"Autovectorization in GCC","author":"naishlos","year":"2004","journal-title":"Proc GCC Developers Summit"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CAMP.2000.875989"},{"key":"ref20","year":"2014","journal-title":"ARM NEON Intrinsics Reference"},{"key":"ref22","article-title":"ARM C language extensions for SVE documentation","year":"2017"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1007\/978-1-4757-2646-6"},{"key":"ref24","author":"muller","year":"2009","journal-title":"Handbook of Floating-Point Arithmetic"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.5194\/gmdd-8-4375-2015"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/CGO.2011.5764683"},{"key":"ref25","article-title":"Auto-vectorization techniques for modern SIMD architectures","author":"krzikalla","year":"2012","journal-title":"Proc Workshop Compilers for Parallel Computers"},{"key":"ref50","first-page":"28","article-title":"Sollya: An environment for the development of numerical codes","author":"chevillard","year":"2010","journal-title":"Proceedings of the 2nd International Congress on Mathematical Software"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1145\/1460361.1460365"},{"key":"ref53","article-title":"Boost Software License 1.0 (BSL-1.0)","author":"abrahams","year":"2003"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1007\/s00450-010-0108-2"},{"key":"ref10","article-title":"AMD core math library","year":"2013"},{"key":"ref11","article-title":"Libmvec in glibc","year":"2015"},{"key":"ref40","article-title":"Intel 64 and IA-32 architectures optimization reference manual","year":"2016"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TC.2008.223"},{"key":"ref13","article-title":"Yeppp! library","author":"dukhan","year":"2013"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-55224-3_9"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1088\/1742-6596\/513\/5\/052027"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/2990194"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/HPCSim.2016.7568423"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA.2007.346199"},{"key":"ref19","doi-asserted-by":"crossref","first-page":"65","DOI":"10.1145\/2370036.2145825","article-title":"Extending a c-like language for portable SIMD programming","volume":"47","author":"lei\u00dfa","year":"2012","journal-title":"ACM SIGPLAN Notices"},{"key":"ref4","article-title":"Sun freely distributable libm version 5.3.","year":"2010"},{"key":"ref3","article-title":"Intel short vector math library","year":"2019"},{"key":"ref6","year":"2011"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ACSSC.2016.7869070"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/103147.103151"},{"key":"ref7","article-title":"The GNU C library (glibc)","year":"2018"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-12868-9_95"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1117\/12.505591"},{"key":"ref46","article-title":"Software manual for the elementary functions","author":"cody","year":"1980"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/PL00009321"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1145\/1057600.1057602"},{"key":"ref47","first-page":"24","article-title":"Implementation and testing of function software","author":"cody","year":"1980","journal-title":"Proc Problems Methodologies Math Softw Prod"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1145\/3297858.3304062"},{"key":"ref41","article-title":"Instruction tables: Lists of instruction latencies, throughputs and micro-operation breakdowns for Intel, AMD and VIA CPUs","author":"fog","year":"0"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1007\/BF01397083"},{"key":"ref43","article-title":"llvm-exegesis: Automatic measurement of instruction latency\/uops","year":"2018"}],"container-title":["IEEE Transactions on Parallel and Distributed Systems"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/71\/8965249\/08936472.pdf?arnumber=8936472","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,15]],"date-time":"2025-01-15T20:20:09Z","timestamp":1736972409000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8936472\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,6,1]]},"references-count":53,"journal-issue":{"issue":"6"},"URL":"https:\/\/doi.org\/10.1109\/tpds.2019.2960333","relation":{},"ISSN":["1045-9219","1558-2183","2161-9883"],"issn-type":[{"value":"1045-9219","type":"print"},{"value":"1558-2183","type":"electronic"},{"value":"2161-9883","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,6,1]]}}}