{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,24]],"date-time":"2025-09-24T10:28:22Z","timestamp":1758709702931},"reference-count":28,"publisher":"Springer Science and Business Media LLC","issue":"2-3","license":[{"start":{"date-parts":[[2005,6,1]],"date-time":"2005-06-01T00:00:00Z","timestamp":1117584000000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Int J Parallel Prog"],"published-print":{"date-parts":[[2005,6]]},"DOI":"10.1007\/s10766-005-3581-7","type":"journal-article","created":{"date-parts":[[2005,7,19]],"date-time":"2005-07-19T10:46:01Z","timestamp":1121769961000},"page":"165-181","source":"Crossref","is-referenced-by-count":6,"title":["Empirical Optimization for a Sparse Linear Solver: A Case Study"],"prefix":"10.1007","volume":"33","author":[{"given":"Yoon-Ju","family":"Lee","sequence":"first","affiliation":[]},{"given":"Pedro C.","family":"Diniz","sequence":"additional","affiliation":[]},{"given":"Mary W.","family":"Hall","sequence":"additional","affiliation":[]},{"given":"Robert","family":"Lucas","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"3581_CR1","unstructured":"LS-DYNA User\u2019s Manual V. 960, Livermore Software Technology Corporation, http:\/\/www.lstc.com (March 2001)"},{"key":"3581_CR2","unstructured":"Ashcraft C., Lucas R.F A Stackless Multifrontal Method, in Proc. 10th SIAM Conference on Parallel Processing for Scientific Computing (March 2001)"},{"key":"3581_CR3","doi-asserted-by":"crossref","unstructured":"Baradaran N., Chame J., Chen C., Diniz P., Hall M., Lee Y., Liu B., Lucas R., ECO: An Empirical-based Compilation and Optimization System, in Proc. of the Workshop on Next Generation Software, held in conjunction with IPDPS\u201903 (April 2003)","DOI":"10.1109\/IPDPS.2003.1213377"},{"key":"3581_CR4","doi-asserted-by":"crossref","unstructured":"Chen C., Chame J., Hall M., Combining Models and Guided Empirical Search to Optimize for Multiple Levels of the Memory Hierarchy, in Int. Symposium on Code Generation and Optimization (CGO\u201905) (March, 2005)","DOI":"10.1109\/CGO.2005.10"},{"key":"3581_CR5","unstructured":"Diniz P., Liu B. Selector: An Effective Technique for Adaptive Computing, in Proc. of the 15th Workshop on Languages and Compilers for Parallel Computing (LCPC\u201902) (July, 2002)"},{"key":"3581_CR6","doi-asserted-by":"crossref","unstructured":"Lee Y., Hall M. A Code Isolator: Isolating Code Fragments from Large programs, in Proc. of the 17th Workshop on Languages and Compilers for Parallel Computing (LCPC\u201904) (September, 2004)","DOI":"10.1007\/11532378_13"},{"key":"3581_CR7","doi-asserted-by":"crossref","unstructured":"Vetter J.S., Worley P. Asserting Performance Expectations, in Proc. of Supercomputing\u201902 (November, 2002)","DOI":"10.1109\/SC.2002.10046"},{"key":"3581_CR8","unstructured":"Diniz P., Lee Y., Hall M., and Lucas R., A Case Study Using Empirical Optimization for a Large, Engineering Application, in Proc. of the Workshop on Next Generation Software, held in Conjunction with IPDPS\u201904 (April, 2003)"},{"key":"3581_CR9","doi-asserted-by":"crossref","unstructured":"Hall M., Amarasinghe S., Murphy B., Liao S., and Lam M., and M Lam, Interprocedural Parallelization Analysis in SUIF, in ACM Trans. on Programming Languages and Systems (2005)","DOI":"10.1145\/1075382.1075385"},{"key":"3581_CR10","unstructured":"MIPSpro C and C++ Pragmas, Document Number 007-3587-003, 1998, 1999 Silicon Graphics, Inc"},{"issue":"3","key":"3581_CR11","first-page":"400","volume":"15","author":"S. Carr","year":"July 1994","journal-title":"in ACM Trans. on Programming Languages and Systems (TOPLAS)"},{"key":"3581_CR12","unstructured":"London K., Dongarra J., Moore S., P Mucci, Seymour K., and T Spencer, End-user Tools for Application Performance Analysis, Using Hardware Counters, Intl. Conference on Parallel and Distributed Computing Systems (August, 2001)"},{"key":"3581_CR13","doi-asserted-by":"crossref","unstructured":"C. Whaley and Dongarra J., Automatically tuned linear algebra software, in. Proc. of Super-computing \u201998 (1998)","DOI":"10.1109\/SC.1998.10004"},{"key":"3581_CR14","doi-asserted-by":"crossref","unstructured":"Bilmes J., Asanovic K., C.-W. Chen, and Demmel J., Optimizing Matrix Multiply using PHiPAC: Portable High-Performance ANSI-C Coding Methodology, in Proc. of the ACM International Conference on Supercomputing \u201997 (1997)","DOI":"10.1145\/263580.263662"},{"key":"3581_CR15","doi-asserted-by":"crossref","unstructured":"D. Mirkovic and Johnsson SL., Automatic Performance Tuning in the UHFFT Library, in Proc. of the International conference on Computational Science (ICCS\u201901) (May, 2001)","DOI":"10.1007\/3-540-45545-0_17"},{"key":"3581_CR16","doi-asserted-by":"crossref","unstructured":"Frigo M., A Fast Fourier Transform Compiler, in Proc. of the ACM SIGPLAN Conference on Programming Language Design and Implementation (PLDI\u201999) (June, 1999)","DOI":"10.1145\/301618.301661"},{"key":"3581_CR17","doi-asserted-by":"crossref","unstructured":"Xiong J., Johnson J., Johnson R., and Padua D., SPL: A Language and Compiler for DSP Algorithms, in Proc. of the ACM Conference on Programming Language Design and Implementation (PLDI\u201901) (June, 2001)","DOI":"10.1145\/378795.378860"},{"key":"3581_CR18","doi-asserted-by":"crossref","unstructured":"M. Wolf and Lam M., A Data Locality Optimization Algorithm, in Proc. of the 1991 ACM SIGPLAN Conference on Programming Language Design and Implementation (PLDI\u201991) (June, 1991)","DOI":"10.1145\/113445.113449"},{"key":"3581_CR19","doi-asserted-by":"crossref","unstructured":"Wolfe M., More iteration space tiling, in Proc. of Supercomputing \u201989 (November, 1989)","DOI":"10.1145\/76263.76337"},{"key":"3581_CR20","doi-asserted-by":"crossref","unstructured":"J. Chame and Moon S., A Title Selection Algorithm for Data Locality and Cache Interference, in Proc. of the 1999 ACM International Conference on Supercomputing\u2019 99 (June, 1999)","DOI":"10.1145\/305138.305245"},{"key":"3581_CR21","doi-asserted-by":"crossref","unstructured":"S. Coleman and McKinley K., Tile Size Selection Using Cache Organization and Data Layout, in Proc. of the ACM SIGPLAN Conference on Programming Language Design and Implementation (PLDI\u201995) (June, 1995)","DOI":"10.1145\/207110.207162"},{"key":"3581_CR22","doi-asserted-by":"crossref","unstructured":"G. Rivera and C.-Tseng W., Data Transformations for Eliminating Conflict Misses, in Proc. of the ACM Conference on Programming Language Design and Implementation (PLDI\u201998) (June, 1998)","DOI":"10.1145\/277650.277661"},{"key":"3581_CR23","doi-asserted-by":"crossref","unstructured":"Lam M., Rothberg E., and Wolf M., The Cache Performance and Optimization of Blocked Algorithms, in Proc. of the 4th International conference on Architectural Support for Programming Languages and Operating Systems (ASPLOS\u201991) (April, 1991)","DOI":"10.1145\/106972.106981"},{"key":"3581_CR24","doi-asserted-by":"crossref","unstructured":"Chatterjee S., Parker E., Hanlon PJ., and Lebeck AR., Exact Analysis of the Cache Behavior of Nested Loops, in Proc. of the 2001 ACM SIGPLAN Conference on Programming Language Design and Implementation (PLDI\u201901) (June, 2001)","DOI":"10.1145\/378795.378859"},{"key":"3581_CR25","doi-asserted-by":"crossref","unstructured":"Ghosh S., Martonosi M., and Malik S., Precise Miss Analysis for Program Transformations with Caches of Arbitrary Associativity, in Proc. of the 8th International Conference on Architectural Support for Programming Languages and Operating Systems (ASPLOS\u201998) (October, 1998)","DOI":"10.1145\/291069.291051"},{"key":"3581_CR26","doi-asserted-by":"crossref","unstructured":"Temam O., Granston E., and Jalby W., To Copy or not to Copy: A Compile-time Technique for Assessing When Data Copying Should be Used to Eliminate Cache Conflicts, in Proc. of Supercomputing \u201993 (November, 1993)","DOI":"10.1145\/169627.169762"},{"key":"3581_CR27","doi-asserted-by":"crossref","unstructured":"M. Voss and Eigenmann R., High-Level Adaptive Program Optimization with ADAPT, in Proc. of the ACM SIGPLAN Conference on Principles and Practice of Parallel Processing (PPoPP\u201901) (June, 2001)","DOI":"10.1145\/379539.379583"},{"key":"3581_CR28","doi-asserted-by":"crossref","unstructured":"Adve V., Lam V., and Ensink B., Language and Compiler Support for Adaptive Distributed Applications, in Proc. of the ACM SIGPLAN Workshop on Optimization of Middleware and Distributed Systems (OM\u201901) (June, 2001)","DOI":"10.1145\/384198.384229"}],"container-title":["International Journal of Parallel Programming"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10766-005-3581-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10766-005-3581-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10766-005-3581-7","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,4,8]],"date-time":"2020-04-08T08:15:09Z","timestamp":1586333709000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10766-005-3581-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2005,6]]},"references-count":28,"journal-issue":{"issue":"2-3","published-print":{"date-parts":[[2005,6]]}},"alternative-id":["3581"],"URL":"https:\/\/doi.org\/10.1007\/s10766-005-3581-7","relation":{},"ISSN":["0885-7458","1573-7640"],"issn-type":[{"value":"0885-7458","type":"print"},{"value":"1573-7640","type":"electronic"}],"subject":[],"published":{"date-parts":[[2005,6]]}}}