{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,1,21]],"date-time":"2025-01-21T05:10:30Z","timestamp":1737436230838,"version":"3.33.0"},"publisher-location":"Berlin, Heidelberg","reference-count":35,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540430094"},{"type":"electronic","value":"9783540453079"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2001]]},"DOI":"10.1007\/3-540-45307-5_21","type":"book-chapter","created":{"date-parts":[[2007,8,16]],"date-time":"2007-08-16T11:10:12Z","timestamp":1187262612000},"page":"237-248","source":"Crossref","is-referenced-by-count":13,"title":["Towards Automatic Synthesis of High-Performance Codes for Electronic Structure Calculations: Data Locality Optimization"],"prefix":"10.1007","author":[{"given":"D.","family":"Cociorva","sequence":"first","affiliation":[]},{"given":"J.","family":"Wilkins","sequence":"additional","affiliation":[]},{"given":"G.","family":"Baumgartner","sequence":"additional","affiliation":[]},{"given":"P.","family":"Sadayappan","sequence":"additional","affiliation":[]},{"given":"J.","family":"Ramanujam","sequence":"additional","affiliation":[]},{"given":"M.","family":"Nooijen","sequence":"additional","affiliation":[]},{"given":"D.","family":"Bernholdt","sequence":"additional","affiliation":[]},{"given":"R.","family":"Harrison","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2001,12,4]]},"reference":[{"key":"21_CR1","doi-asserted-by":"crossref","unstructured":"N. Ahmed, N. Mateev, and K. Pingali. Synthesizing transformations for locality enhancementof imperfectly-nested loops. ACM Intl. Conf. on Supercomputing, 2000.","DOI":"10.1145\/335231.335245"},{"key":"21_CR2","volume-title":"Parallel Implementation of Quasiparticle Calculations of Semiconductors andInsulators","author":"W. Aulbur","year":"1996","unstructured":"W. Aulbur. Parallel Implementation of Quasiparticle Calculations of Semiconductors andInsulators, Ph.D. Dissertation, Ohio State University, Columbus, OH, October 1996."},{"key":"21_CR3","doi-asserted-by":"crossref","unstructured":"J. Bilmes, K. Asanovic, C. Chin, and J. Demmel. Optimizing matrix multiply using PHiPAC.In Proc. ACM International Conference on Supercomputing, pp. 340\u2013347, 1997.","DOI":"10.1145\/263580.263662"},{"key":"21_CR4","doi-asserted-by":"crossref","unstructured":"D. Cociorva, J. Wilkins, C.-C. Lam, G. Baumgartner, P. Sadayappan, and J. Ramanujam.Loop optimization for a class of memory-constrained computations. In Proc. 15th ACM InternationalConference on Supercomputing, pp. 500\u2013509, Sorrento, Italy, June 2001.","DOI":"10.1145\/377792.377814"},{"key":"21_CR5","first-page":"1381","volume":"3","author":"M. Frigo","year":"1998","unstructured":"M. Frigo and S. Johnson. FFTW: An adaptive software architecture for the FFT. In Proc.ICASSP 98, Volume 3, pages 1381\u20131384, 1998, http:\/\/www.fftw.org .","journal-title":"Proc.ICASSP 98"},{"key":"21_CR6","doi-asserted-by":"crossref","unstructured":"G. Gao, R. Olsen, V. Sarkar and R. Thekkath. Collective Loop Fusion for Array Contraction.Proc. 5th LCPC Workshop New Haven, CT, Aug. 1992.","DOI":"10.1007\/3-540-57502-2_53"},{"key":"21_CR7","doi-asserted-by":"crossref","unstructured":"S. Ghosh, M. Martonosi and S. Malik. Precise Miss Analysis for Program Transformationswith Caches of Arbitrary Associativity. 8th ACM Intl. Conf. on Architectural Support forProgramming Languages and Operating Systems, San Jose, CA, Oct. 1998.","DOI":"10.1145\/291069.291051"},{"key":"21_CR8","doi-asserted-by":"crossref","first-page":"5390","DOI":"10.1103\/PhysRevB.34.5390","volume":"34","author":"M. S. Hybertsen","year":"1986","unstructured":"M. S. Hybertsen and S. G. Louie. Electronic correlation in semiconductors and insulators:band gaps and quasiparticle energies. Phys. Rev. B, 34:5390, 1986.","journal-title":"Phys. Rev. B"},{"issue":"4","key":"21_CR9","doi-asserted-by":"publisher","first-page":"449","DOI":"10.1007\/BF01189337","volume":"9","author":"J. Johnson","year":"1990","unstructured":"J. Johnson, R. Johnson, D. Rodriguez, and R. Tolimieri. A methodology for designing, modifying,and implementing Fourier transform algorithms on various architectures. Circuits,Systems and Signal Processing, 9(4):449\u2013500, 1990.","journal-title":"Circuits,Systems and Signal Processing"},{"key":"21_CR10","doi-asserted-by":"crossref","unstructured":"K. Kennedy et. al., Telescoping Languages: A Strategy for Automatic Generation of ScientificProblem-Solving Systems from Annotated Libraries. To appear in Journal of Paralleland Distributed Computing, 2001.","DOI":"10.1006\/jpdc.2001.1724"},{"key":"21_CR11","doi-asserted-by":"crossref","unstructured":"K. Kennedy. Fast greedy weighted fusion. ACM Intl. Conf. on Supercomputing, May 2000.","DOI":"10.1145\/335231.335244"},{"key":"21_CR12","doi-asserted-by":"crossref","unstructured":"I. Kodukula, N. Ahmed, and K. Pingali. Data-centric multi-level blocking. In Proc. SIGPLANConf. Programming Language Design and Implementation, June 1997.","DOI":"10.1145\/258915.258946"},{"key":"21_CR13","doi-asserted-by":"crossref","unstructured":"I. Kodukula, K. Pingali, R. Cox, and D. Maydan. An experimental evaluation of tiling andshackling for memory hierarchy management. In Proc. ACM International Conference onSupercomputing (ICS 99), Rhodes, Greece, June 1999.","DOI":"10.1145\/305138.305243"},{"key":"21_CR14","volume-title":"Performance Optimization of a Class of Loops Implementing Multi-DimensionalIntegrals","author":"C. Lam","year":"1999","unstructured":"C. Lam. Performance Optimization of a Class of Loops Implementing Multi-DimensionalIntegrals, Ph.D. Dissertation, The Ohio State University, Columbus, OH, August 1999."},{"key":"21_CR15","doi-asserted-by":"crossref","unstructured":"C. Lam, D. Cociorva, G. Baumgartner and P. Sadayappan. Optimization of Memory Usageand Communication Requirements for a Class of Loops Implementing Multi-DimensionalIntegrals. Proc. 12th LCPC Workshop San Diego, CA, Aug. 1999.","DOI":"10.1007\/3-540-44905-1_22"},{"key":"21_CR16","doi-asserted-by":"crossref","unstructured":"C. Lam, D. Cociorva, G. Baumgartner, and P. Sadayappan. Memory-optimal evaluation ofexpression trees involving large objects. In Proc. Intl. Conf. on High Perf. Comp., Dec. 1999.","DOI":"10.1007\/978-3-540-46642-0_15"},{"key":"21_CR17","doi-asserted-by":"crossref","unstructured":"C. Lam, P. Sadayappan, and R. Wenger. Optimal reordering and mapping of a class ofnested-loops for parallel execution. In 9th LCPC Workshop, San Jose, Aug. 1996.","DOI":"10.1007\/BFb0017261"},{"issue":"2","key":"21_CR18","doi-asserted-by":"publisher","first-page":"157","DOI":"10.1142\/S0129626497000176","volume":"7","author":"C. Lam","year":"1997","unstructured":"C. Lam, P. Sadayappan and R. Wenger. On Optimizing a Class of Multi-Dimensional Loopswith Reductions for Parallel Execution. Par. Proc. Lett., (7) 2, pp. 157\u2013168, 1997.","journal-title":"Par. Proc. Lett."},{"key":"21_CR19","unstructured":"C. Lam, P. Sadayappan and R. Wenger. Optimization of a Class of Multi-Dimensional Integralson Parallel Machines. Proc. of Eighth SIAM Conf. on Parallel Processing for ScientificComputing, Minneapolis, MN, March 1997."},{"key":"21_CR20","doi-asserted-by":"crossref","unstructured":"M. S. Lam, E. E. Rothberg, and M. E. Wolf. The cache performance and optimizations ofblocked algorithms. In Proc. of Fourth Intl. Conf. on Architectural Support for ProgrammingLanguages and Operating Systems, April 1991.","DOI":"10.1145\/106972.106981"},{"key":"21_CR21","doi-asserted-by":"crossref","unstructured":"T. J. Lee and G. E. Scuseria. Achieving chemical accuracy with coupled cluster theory. InS.R. Langhoff (Ed.), Quantum Mechanical Electronic Structure Calculations with ChemicalAccuracy, pp. 47\u2013109, Kluwer Academic, 1997.","DOI":"10.1007\/978-94-011-0193-6_2"},{"key":"21_CR22","doi-asserted-by":"crossref","unstructured":"W. Li. Compiler cache optimizations for banded matrix problems. In International Conferenceon Supercomputing, Barcelona, Spain, July 1995.","DOI":"10.1145\/224538.224541"},{"key":"21_CR23","unstructured":"J. M. L. Martin. InP. v. R. Schleyer, P. R. Schreiner, N. L. Allinger, T. Clark, J. Gasteiger, P. Kollman, H. F. SchaeferIII (Eds.), Encyclopedia of Computational Chemistry. Wiley &Sons, Berne (Switzerland). Vol. 1, pp. 115\u2013128, 1998."},{"issue":"4","key":"21_CR24","doi-asserted-by":"publisher","first-page":"424","DOI":"10.1145\/233561.233564","volume":"18","author":"K. S. McKinley","year":"1996","unstructured":"K. S. McKinley, S. Carr and C.-W. Tseng. Improving Data Locality with Loop Transformations.ACM TOPLAS, 18(4):424\u2013453, July 1996.","journal-title":"ACM TOPLAS"},{"issue":"6","key":"21_CR25","doi-asserted-by":"publisher","first-page":"641","DOI":"10.1023\/A:1018782528453","volume":"26","author":"N. Mitchell","year":"1998","unstructured":"N. Mitchell, K. H\u00f6gstedt, L. Carter, and J. Ferrante. Quantifying the multi-level nature oftiling interactions. Intl. Journal of Parallel Programming, 26(6):641\u2013670, June 1998.","journal-title":"Intl. Journal of Parallel Programming"},{"key":"21_CR26","doi-asserted-by":"crossref","unstructured":"G. Rivera and C.-W. Tseng. Data Transformations for Eliminating Conflict Misses. ACMSIGPLAN PLDI, June 1998.","DOI":"10.1145\/277650.277661"},{"key":"21_CR27","doi-asserted-by":"crossref","unstructured":"G. Rivera and C.-W. Tseng. Eliminating Conflict Misses for High Performance Architectures.Proc. of 1998 Intl. Conf. on Supercomputing, July 1998.","DOI":"10.1145\/277830.277917"},{"key":"21_CR28","doi-asserted-by":"publisher","first-page":"1827","DOI":"10.1103\/PhysRevLett.74.1827","volume":"74","author":"H. N. Rojas","year":"1995","unstructured":"H. N. Rojas, R.W. Godby, and R. J. Needs. Space-time method for Ab-initio calculations ofself-energies and dielectric response functions of solids. Phys. Rev. Lett., 74:1827, 1995.","journal-title":"Phys. Rev. Lett."},{"issue":"6","key":"21_CR29","doi-asserted-by":"publisher","first-page":"340","DOI":"10.1093\/comjnl\/40.6.340","volume":"40","author":"S. Singhai","year":"1997","unstructured":"S. Singhai and K. S. McKinley. A Parameterized Loop Fusion Algorithm for ImprovingParallelism and Cache Locality. The Computer Journal, 40(6):340\u2013355, 1997.","journal-title":"The Computer Journal"},{"key":"21_CR30","doi-asserted-by":"crossref","unstructured":"Y. Song and Z. Li. New Tiling Techniques to Improve Cache Temporal Locality. ACM SIGPLANPLDI, May 1999.","DOI":"10.1145\/301618.301668"},{"key":"21_CR31","doi-asserted-by":"crossref","unstructured":"M. Thottethodi, S. Chatterjee, and A. Lebeck. Tuning Strassen\u2019s matrix multiplication formemory hierarchies. In Proc. Supercomputing\u2019 98, Nov. 1998.","DOI":"10.1109\/SC.1998.10045"},{"key":"21_CR32","doi-asserted-by":"crossref","unstructured":"R. Whaley and J. Dongarra. Automatically Tuned Linear Algebra Software (ATLAS). InProc. Supercomputing\u2019 98, Nov. 1998.","DOI":"10.1109\/SC.1998.10004"},{"key":"21_CR33","unstructured":"M. E. Wolf and M. S. Lam. A Data Locality Algorithm. ACM SIGPLAN PLDI, June 1991."},{"key":"21_CR34","doi-asserted-by":"crossref","unstructured":"M. E. Wolf, D. E. Maydan, and D. J. Chen. Combining loop transformations consideringcaches and scheduling. In Proceedings of the 29th Annual International Symposium on Microarchitecture,pages 274\u2013286, Paris, France, December 2-4, 1996.","DOI":"10.1109\/MICRO.1996.566468"},{"key":"21_CR35","doi-asserted-by":"crossref","unstructured":"J. Xiong, D. Padua, and J. Johnson. SPL: A language and compiler for DSP algorithms. ACMSIGPLAN PLDI, June 2001.","DOI":"10.1145\/378795.378860"}],"container-title":["Lecture Notes in Computer Science","High Performance Computing \u2014 HiPC 2001"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/3-540-45307-5_21","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,20]],"date-time":"2025-01-20T11:36:17Z","timestamp":1737372977000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/3-540-45307-5_21"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2001]]},"ISBN":["9783540430094","9783540453079"],"references-count":35,"URL":"https:\/\/doi.org\/10.1007\/3-540-45307-5_21","relation":{},"ISSN":["0302-9743"],"issn-type":[{"type":"print","value":"0302-9743"}],"subject":[],"published":{"date-parts":[[2001]]}}}