{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,5]],"date-time":"2024-09-05T01:55:33Z","timestamp":1725501333709},"publisher-location":"Berlin, Heidelberg","reference-count":18,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540775591"},{"type":"electronic","value":"9783540775607"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"DOI":"10.1007\/978-3-540-77560-7_4","type":"book-chapter","created":{"date-parts":[[2008,1,17]],"date-time":"2008-01-17T06:13:02Z","timestamp":1200550382000},"page":"38-52","source":"Crossref","is-referenced-by-count":10,"title":["Modeling Multigrain Parallelism on Heterogeneous Multi-core Processors: A Case Study of the Cell BE"],"prefix":"10.1007","author":[{"given":"Filip","family":"Blagojevic","sequence":"first","affiliation":[]},{"given":"Xizhou","family":"Feng","sequence":"additional","affiliation":[]},{"given":"Kirk W.","family":"Cameron","sequence":"additional","affiliation":[]},{"given":"Dimitrios S.","family":"Nikolopoulos","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"4_CR1","unstructured":"IBM Corporation. Cell Broadband Engine Architecture, Version 1.01. Technical report, (October 2006)"},{"key":"4_CR2","unstructured":"Fahey, M., Alam, S., Dunigan, T., Vetter, J., Worley, P.: Early Evaluation of the Cray XD1. In: Proc. of the 2005 Cray Users Group Meeting (2005)"},{"key":"4_CR3","unstructured":"Starbridge Systems. A Reconfigurable Computing Model for Biological Research: Application of Smith-Waterman Analysis to Bacterial Genomes. Technical report (2005)"},{"key":"4_CR4","unstructured":"Chamberlain, R., Miller, S., White, J., Gall, D.: Highly-Scalable Reconfigurable Computing. In: Proc. 
of the 2005 MAPLD International Conference, Washington, DC (September 2005)"},{"key":"4_CR5","doi-asserted-by":"crossref","unstructured":"Blagojevic, F., Nikolopoulos, D., Stamatakis, A., Antonopoulos, C.: Dynamic Multigrain Parallelization on the Cell Broadband Engine. In: Proc. of the 2007 ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming, San Jose, CA, pp. 90\u2013100 (March 2007)","DOI":"10.1145\/1229428.1229445"},{"key":"4_CR6","doi-asserted-by":"crossref","unstructured":"Culler, D., Karp, R., Patterson, D., Sahay, A., Schauser, K., Santos, E., Subramonian, R., Von Eicken, T.: LogP: Towards a Realistic Model of Parallel Computation. In: PPoPP 1993. Proc. of the 4th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming (May 1993)","DOI":"10.1145\/155332.155333"},{"issue":"12","key":"4_CR7","doi-asserted-by":"publisher","first-page":"1390","DOI":"10.1109\/TPDS.2006.165","volume":"17","author":"J. Bosque","year":"2006","unstructured":"Bosque, J., Pastor, L.: A Parallel Computational Model for Heterogeneous Clusters. IEEE Transactions on Parallel and Distributed Systems\u00a017(12), 1390\u20131400 (2006)","journal-title":"IEEE Transactions on Parallel and Distributed Systems"},{"issue":"5","key":"4_CR8","doi-asserted-by":"publisher","first-page":"519","DOI":"10.1007\/BF02577777","volume":"22","author":"M. Girkar","year":"1994","unstructured":"Girkar, M., Polychronopoulos, C.: The Hierarchical Task Graph as a Universal Intermediate Representation. International Journal of Parallel Programming\u00a022(5), 519\u2013551 (1994)","journal-title":"International Journal of Parallel Programming"},{"key":"4_CR9","doi-asserted-by":"crossref","unstructured":"Gropp, W., Lusk, E.: Reproducible Measurements of MPI Performance Characteristics. In: Proc. of the 6th European PVM\/MPI User\u2019s Group Meeting, Barcelona, Spain, pp. 
11\u201318 (September 1999)","DOI":"10.1007\/3-540-48158-3_2"},{"key":"4_CR10","doi-asserted-by":"crossref","unstructured":"Feng, X., Cameron, K., Buell, D.: PBPI: a high performance Implementation of Bayesian Phylogenetic Inference. In: Proc. of Supercomputing 2006, Tampa, FL (November 2006)","DOI":"10.1109\/SC.2006.47"},{"issue":"7-8","key":"4_CR11","doi-asserted-by":"publisher","first-page":"707","DOI":"10.1016\/S0743-7315(03)00079-0","volume":"63","author":"X. Feng","year":"2003","unstructured":"Feng, X., Buell, D., Rose, J., Waddell, P.: Parallel algorithms for bayesian phylogenetic inference. Journal of Parallel Distributed Computing\u00a063(7-8), 707\u2013718 (2003)","journal-title":"Journal of Parallel Distributed Computing"},{"key":"4_CR12","doi-asserted-by":"crossref","unstructured":"Feng, X., Cameron, K., Smith, B., Sosa, C.: Building the Tree of Life on Terascale Systems. In: Proc. of the 21st International Parallel and Distributed Processing Symposium, Long Beach, CA (March 2007)","DOI":"10.1109\/IPDPS.2007.370214"},{"issue":"8","key":"4_CR13","doi-asserted-by":"publisher","first-page":"103","DOI":"10.1145\/79173.79181","volume":"22","author":"L. Valiant","year":"1990","unstructured":"Valiant, L.: A bridging model for parallel computation. Communications of the ACM\u00a022(8), 103\u2013111 (1990)","journal-title":"Communications of the ACM"},{"key":"4_CR14","doi-asserted-by":"crossref","unstructured":"Cameron, K., Sun, X.: Quantifying Locality Effect in Data Access Delay: Memory LogP. In: Proc. of the 17th International Parallel and Distributed Processing Symposium, Nice, France (April 2003)","DOI":"10.1109\/IPDPS.2003.1213137"},{"key":"4_CR15","doi-asserted-by":"crossref","unstructured":"Alexandrov, A., Ionescu, M., Schauser, C., Scheiman, C.: LogGP: Incorporating Long Messages into the LogP Model: One Step Closer towards a Realistic Model for Parallel Computation. In: Proc. 
of the 7th Annual ACM Symposium on Parallel Algorithms and Architectures, Santa Barbara, CA, pp. 95\u2013105 (June 1995)","DOI":"10.1145\/215399.215427"},{"key":"4_CR16","series-title":"Lecture Notes in Computer Science","volume-title":"Open Hypermedia Systems and Structural Computing","author":"F. Cappello","year":"2000","unstructured":"Cappello, F., Etiemble, D.: MPI vs. MPI+OpenMP on the IBM SP for the NAS Benchmarks. In: Reich, S., Anderson, K.M. (eds.) Open Hypermedia Systems and Structural Computing. LNCS, vol.\u00a01903, Springer, Heidelberg (2000)"},{"key":"4_CR17","doi-asserted-by":"crossref","unstructured":"Krawezik, G.: Performance Comparison of MPI and three OpenMP Programming Styles on Shared Memory Multiprocessors. In: Proc. of the 15th Annual ACM Symposium on Parallel Algorithms and Architectures (2003)","DOI":"10.1145\/777412.777433"},{"key":"4_CR18","doi-asserted-by":"crossref","unstructured":"Sharapov, I., Kroeger, R., Delamater, G., Cheveresan, R., Ramsay, M.: A Case Study in Top-Down Performance Estimation for a Large-Scale Parallel Application. In: Proc. of the 11th ACM SIGPLAN Symposium on Principles and Practice of Parallel Programming, New York, pp. 
81\u201389 (March 2006)","DOI":"10.1145\/1122971.1122985"}],"container-title":["Lecture Notes in Computer Science","High Performance Embedded Architectures and Compilers"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-77560-7_4.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,4,27]],"date-time":"2021-04-27T10:44:29Z","timestamp":1619520269000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-77560-7_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[null]]},"ISBN":["9783540775591","9783540775607"],"references-count":18,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-77560-7_4","relation":{},"subject":[]}}