{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,1]],"date-time":"2025-11-01T09:14:35Z","timestamp":1761988475043,"version":"3.40.3"},"publisher-location":"Berlin, Heidelberg","reference-count":24,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783642309601"},{"type":"electronic","value":"9783642309618"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2012]]},"DOI":"10.1007\/978-3-642-30961-8_5","type":"book-chapter","created":{"date-parts":[[2012,5,22]],"date-time":"2012-05-22T17:44:50Z","timestamp":1337708690000},"page":"59-72","source":"Crossref","is-referenced-by-count":21,"title":["Extending OpenMP* with Vector Constructs for Modern Multicore SIMD Architectures"],"prefix":"10.1007","author":[{"given":"Michael","family":"Klemm","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alejandro","family":"Duran","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xinmin","family":"Tian","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hideki","family":"Saito","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Diego","family":"Caballero","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xavier","family":"Martorell","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","reference":[{"issue":"5","key":"5_CR1","doi-asserted-by":"publisher","first-page":"67","DOI":"10.1145\/1941487.1941507","volume":"54","author":"S. Borkar","year":"2011","unstructured":"Borkar, S., Chien, A.A.: The Future of Microprocessors. Communications of the ACM\u00a054(5), 67\u201377 (2011)","journal-title":"Communications of the ACM"},{"key":"5_CR2","unstructured":"Caballero, D.L.: User-directed Vectorization in OmpSs. Master\u2019s thesis, Universitat Polit\u00e8cnica de Catalunya, Barcelona, Spain (September 2011)"},{"key":"5_CR3","unstructured":"Barcelona Supercomputing Center. The NANOS Group Site: The Mercurium Compiler, http:\/\/nanos.ac.upc.edu\/mcxx"},{"issue":"6","key":"5_CR4","doi-asserted-by":"publisher","first-page":"398","DOI":"10.1016\/j.micpro.2006.02.011","volume":"30","author":"M. Omer Cheema","year":"2006","unstructured":"Omer Cheema, M., Hammami, O.: Application-specific SIMD Synthesis for Reconfigurable Architectures. Microprocessors and Microsystems\u00a030(6), 398\u2013412 (2006)","journal-title":"Microprocessors and Microsystems"},{"key":"5_CR5","doi-asserted-by":"crossref","unstructured":"Eichenberger, A.E., Wu, P., O\u2019Brien, K.: Vectorization for SIMD Architectures with Alignment Constraints. In: Proc. of the ACM SIGPLAN 2004 Conf. on Programming Language Design and Implementation, Washington, D.C, pp. 82\u201393 (June 2004)","DOI":"10.1145\/996841.996853"},{"key":"5_CR6","unstructured":"Free Software Foundation Inc. GCC 4.7 Release Series (March 2012), http:\/\/gcc.gnu.org\/gcc-4.7\/"},{"key":"5_CR7","doi-asserted-by":"crossref","unstructured":"Heinecke, A., Klemm, M., Bungartz, H.-J.: From GPGPUs to Many-Core: NVIDIA Fermi* and Intel\u00ae Many Integrated Core Architecture. Computing in Science and Engineering (to appear, 2012)","DOI":"10.1109\/MCSE.2012.23"},{"key":"5_CR8","doi-asserted-by":"crossref","unstructured":"Heinecke, A., Pfl\u00fcger, D.: Multi- and many-core data mining with adaptive sparse grids. In: Proc. of the 8th ACM Intl. Conf. on Computing Frontiers, New York, pp. 29:1\u201329:10 (May 2011)","DOI":"10.1145\/2016604.2016640"},{"key":"5_CR9","unstructured":"Intel Corporation. Intel\u00ae Advanced Vector Extensions Programming Reference, Document number 319433-011 (June 2011)"},{"key":"5_CR10","doi-asserted-by":"crossref","unstructured":"Karrenberg, R., Hack, S.: Whole-Function Vectorization. In: Proc. of the 9th Intl. Ann. IEEE\/ACM Symp. on Code Generation and Optimization, Charmonix, France, pp. 141\u2013150 (April 2011)","DOI":"10.1109\/CGO.2011.5764682"},{"key":"5_CR11","unstructured":"Khronos OpenCL Working Group. The OpenCL Specification (February 2009), http:\/\/www.khronos.org\/registry\/cl\/"},{"key":"5_CR12","unstructured":"Krzikalla, O., Feldhoff, K., M\u00fcller-Pfefferkorn, R., Nagel, W.E.: Auto-Vectorization Techniques for Modern SIMD Architectures. In: Proc. of the 16th Workshop on Compilers for Parallel Computing, Padova, Italy (January 2012)"},{"key":"5_CR13","doi-asserted-by":"crossref","unstructured":"Larsen, S., Amarasinghe, S.: Exploiting Superword Level Parallelism with Multimedia Instruction Sets. In: Proc. of the ACM SIGPLAN 2000 Conf. on Programming Language Design and Implementation, Vancouver, BC, Canada, pp. 145\u2013156 (June 2000)","DOI":"10.1145\/358438.349320"},{"key":"5_CR14","doi-asserted-by":"crossref","unstructured":"Maleki, S., Gao, Y., Garzar\u00e1n, M.J., Wong, T., Padua, D.A.: An Evaluation of Vectorizing Compilers. In: Proc. of the 2011 Intl. Conf. on Parallel Architectures and Compilation Techniques, Galveston Island, TX, pp. 372\u2013382 (October 2011)","DOI":"10.1109\/PACT.2011.68"},{"key":"5_CR15","doi-asserted-by":"crossref","unstructured":"Naishlos, D., Biberstein, M., Ben-David, S., Zaks, A.: Vectorizing for a SIMdD DSP architecture. In: Proc. of the 2003 Intl. Conf. on Compilers, Architecture and Synthesis for Embedded Systems, San Jose, CA, pp. 2\u201311 (October 2003)","DOI":"10.1145\/951710.951714"},{"key":"5_CR16","unstructured":"Naishlos, D., Biberstein, M., Zaks, A.: Compiler Vectorization Techniques for a Disjoint SIMD Architecture. Technical Report H-0146, IBM Research Division, Haifa, Israel (November 2002)"},{"key":"5_CR17","doi-asserted-by":"crossref","unstructured":"Nuzman, D., Henderson, R.: Multi-platform Auto-vectorization. In: Proc. of the 4th Ann. IEEE\/ACM Intl. Symp. on Code Generation and Optimization, New York, pp. 281\u2013294 (March 2006)","DOI":"10.1109\/CGO.2006.25"},{"key":"5_CR18","doi-asserted-by":"crossref","unstructured":"Nuzman, D., Rosen, I., Zaks, A.: Auto-vectorization of Interleaved Data for SIMD. In: Proc. of the 2006 ACM SIGPLAN Conf. on Programming Language Design and Implementation, Ottawa, ON, Canada, pp. 132\u2013143 (June 2006)","DOI":"10.1145\/1133981.1133997"},{"key":"5_CR19","doi-asserted-by":"crossref","unstructured":"Nuzman, D., Zaks, A.: Outer-loop Vectorization: Revisited for Short SIMD Architectures. In: Proc. of the 17th Intl. Conf. on Parallel Architectures and Compilation Techniques, Toronto, ON, Canada, pp. 2\u201311 (October 2008)","DOI":"10.1145\/1454115.1454119"},{"key":"5_CR20","unstructured":"OpenMP Architecture Review Board. OpenMP Application Program Interface, Version 3.1 (July 2011), http:\/\/www.openmp.org\/"},{"key":"5_CR21","doi-asserted-by":"crossref","unstructured":"Sutter, H.: The Free Lunch Is Over\u2014A Fundamental Turn Toward Concurrency in Software. Dr. Dobb\u2019s Journal\u00a030(3) (March 2005)","DOI":"10.1145\/1095408.1095421"},{"key":"5_CR22","unstructured":"Tian, X., Saito, H., Preis, S.V., Kozhukhov, S.S., Cherkasov, A.G., Nelson, C., Panchenko, N., Geva, R.: Compiling C\/C++ SIMD Extensions for Function and Loop Vectorization on Multicore-SIMD Processors. In: Multicore and GPU Programming Models, Languages and Compilers Workshop (Submitted for peer review)"},{"key":"5_CR23","unstructured":"Wu, P., Eichenberger, A.E., Wang, A.: Efficient SIMD Code Generation for Runtime Alignment and Length Conversion. In: Proc. of the 3rd Ann. IEEE\/ACM Intl. Symp. on Code Generation and Optimization, Jan Jose, CA, pp. 153\u2013164 (March 2005)"},{"key":"5_CR24","doi-asserted-by":"crossref","unstructured":"Wu, P., Eichenberger, A.E., Wang, A., Zhao, P.: An Integrated Simdization Framework Using Virtual Vectors. In: Proc. of the 19th Annual Intl. Conf. on Supercomputing, Boston, MA, USA, pp. 169\u2013178 (June 2005)","DOI":"10.1145\/1088149.1088172"}],"container-title":["Lecture Notes in Computer Science","OpenMP in a Heterogeneous World"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-642-30961-8_5.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,3,28]],"date-time":"2025-03-28T15:09:05Z","timestamp":1743174545000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-642-30961-8_5"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2012]]},"ISBN":["9783642309601","9783642309618"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-642-30961-8_5","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2012]]}}}