{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,21]],"date-time":"2026-03-21T19:22:19Z","timestamp":1774120939353,"version":"3.50.1"},"reference-count":46,"publisher":"Springer Science and Business Media LLC","issue":"6","license":[{"start":{"date-parts":[[2014,10,26]],"date-time":"2014-10-26T00:00:00Z","timestamp":1414281600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Parallel Prog"],"published-print":{"date-parts":[[2015,12]]},"DOI":"10.1007\/s10766-014-0336-3","type":"journal-article","created":{"date-parts":[[2014,10,25]],"date-time":"2014-10-25T02:51:45Z","timestamp":1414205505000},"page":"1004-1027","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Invasive Compute Balancing for Applications with Shared and Hybrid Parallelization"],"prefix":"10.1007","volume":"43","author":[{"given":"Martin","family":"Schreiber","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Christoph","family":"Riesinger","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tobias","family":"Neckel","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hans-Joachim","family":"Bungartz","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Alexander","family":"Breuer","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2014,10,26]]},"reference":[{"key":"336_CR1","doi-asserted-by":"crossref","unstructured":"Aizinger, V.: A discontinuous Galerkin method for two-dimensional flow and transport in shallow water. Adv. Water Resour. 25, 67\u201384 (2002)","DOI":"10.1016\/S0309-1708(01)00019-7"},{"key":"336_CR2","doi-asserted-by":"crossref","unstructured":"Al Faruque, M.A., Krist, R., Henkel, J.: ADAM: run-time agent-based distributed application mapping for on-chip communication. In: Proceedings of the 45th Annual Design Automation Conference, ACM, New York, NY, USA, DAC \u201908, pp. 760\u2013765 (2008)","DOI":"10.1145\/1391469.1391664"},{"key":"336_CR3","doi-asserted-by":"crossref","unstructured":"Bader, M., Breuer, A., Schreiber, M.: Parallel fully adaptive tsunami simulations. In: Facing the Multicore-Challenge III, Institut f\u00fcr Informatik, Technische Universit\u00e4t M\u00fcnchen, Springer, Heidelberg, Germany. Lecture Notes in Computer Science, vol. 7686 (2012a)","DOI":"10.1007\/978-3-642-35893-7_19"},{"key":"336_CR4","doi-asserted-by":"crossref","unstructured":"Bader, M., Bungartz, H.J., Schreiber, M.: Invasive computing on high performance shared memory systems. In: Facing the Multicore-Challenge III. Lecture Notes in Computer Science, vol. 7686, pp. 1\u201312. Springer (2012b)","DOI":"10.1007\/978-3-642-35893-7_1"},{"key":"336_CR5","doi-asserted-by":"crossref","unstructured":"Bangerth, W., Hartmann, R., Kanschat, G.: Deal.II\u2014a general purpose object oriented finite element library. ACM Trans. Math. Softw. 33(4), 1\u201327 (2007)","DOI":"10.1090\/S0002-9947-06-03836-0"},{"key":"336_CR6","doi-asserted-by":"crossref","unstructured":"Becchi, M., Crowley, P.: Dynamic thread assignment on heterogeneous multiprocessor architectures. In: Proceedings of the 3rd Conference on Computing Frontiers, ACM, New York, NY, USA, CF \u201906, pp. 29\u201340 (2006)","DOI":"10.1145\/1128022.1128029"},{"key":"336_CR7","doi-asserted-by":"crossref","unstructured":"Behrens, J.: Efficiency for adaptive triangular meshes: key issues of future approaches. In: Hamilton, K., Lohmann, G., Mysak, L. A. (eds.) Earth System Modelling, vol. 2. Springer (2012)","DOI":"10.1007\/978-3-642-23831-4_5"},{"key":"336_CR8","doi-asserted-by":"crossref","unstructured":"Bhadauria, M., McKee, S.: An approach to resource-aware co-scheduling for CMPs. In: Proceedings of the 24th ACM International Conference on Supercomputing, ACM, ICS \u201910, pp. 189\u2013199 (2010)","DOI":"10.1145\/1810085.1810113"},{"key":"336_CR9","unstructured":"BODC.: Centenary Edition of the GEBCO Digital Atlas (2013)"},{"key":"336_CR10","unstructured":"Bolosky, W.J., Scott, M.L.: False sharing and its effect on shared memory performance. In: 4th Symposium on Experimental Distributed and Multiprocessor Systems, pp. 57\u201371 (1993)"},{"issue":"3","key":"336_CR11","doi-asserted-by":"crossref","first-page":"1103","DOI":"10.1137\/100791634","volume":"33","author":"C Burstedde","year":"2011","unstructured":"Burstedde, C., Wilcox, L.C., Ghattas, O.: p4est: scalable algorithms for parallel adaptive mesh refinement on forests of octrees. SIAM J. Sci. Comput. 33(3), 1103\u20131133 (2011). doi: 10.1137\/100791634","journal-title":"SIAM J. Sci. Comput."},{"key":"336_CR12","doi-asserted-by":"crossref","first-page":"4613","DOI":"10.1098\/rsta.2009.0158","volume":"367","author":"C Castro","year":"2009","unstructured":"Castro, C., K\u00e4ser, M., Toro, E.: Space-time adaptive numerical methods for geophysical applications. Philos. Trans. R. Soc. A Math. Phys. Eng. Sci. 367, 4613\u20134631 (2009)","journal-title":"Philos. Trans. R. Soc. A Math. Phys. Eng. Sci."},{"key":"336_CR13","unstructured":"Corbal\u00e1n, J., Martorell, X., Labarta, J.: Performance-driven processor allocation. In: Proceedings of the 4th Conference on Symposium on Operating System Design & Implementation, vol. 4 (2000)"},{"issue":"7","key":"336_CR14","doi-asserted-by":"crossref","first-page":"599","DOI":"10.1109\/TPDS.2005.85","volume":"16","author":"J Corbalan","year":"2005","unstructured":"Corbalan, J., Martorell, X., Labarta, J.: Performance-driven processor allocation. IEEE Trans. Parallel Distrib. Syst. 16(7), 599\u2013611 (2005)","journal-title":"IEEE Trans. Parallel Distrib. Syst."},{"key":"336_CR15","doi-asserted-by":"crossref","unstructured":"De Grande, R., Boukerche, A.: Dynamic load redistribution based on migration latency analysis for distributed virtual simulations. In: 2011 IEEE International Workshop on Haptic Audio Visual Environments and Games (HAVE), pp. 88\u201393 (2011). doi: 10.1109\/HAVE.2011.6088397","DOI":"10.1109\/HAVE.2011.6088397"},{"key":"336_CR16","doi-asserted-by":"crossref","unstructured":"Drosinos, N., Koziris, N.: Performance comparison of pure MPI vs hybrid MPI-OpenMP parallelization models on SMP clusters. In: Parallel and Distributed Processing Symposium 2004 IEEE (2004)","DOI":"10.1109\/IPDPS.2004.1302919"},{"issue":"1","key":"336_CR17","doi-asserted-by":"crossref","first-page":"65","DOI":"10.1016\/0097-8493(93)90052-B","volume":"17","author":"JS Falby","year":"1993","unstructured":"Falby, J.S., Zyda, M.J., Pratt, D.R., Mackey, R.L.: NPSNET: hierarchical data structures for real-time three-dimensional visual simulation. Comput. Graph. 17(1), 65\u201369 (1993)","journal-title":"Comput. Graph."},{"key":"336_CR18","doi-asserted-by":"crossref","first-page":"386","DOI":"10.1145\/1013812.18215","volume":"16","author":"BD Fleisch","year":"1986","unstructured":"Fleisch, B.D.: Distributed system V IPC in LOCUS: a design and implementation retrospective. ACM SIGCOMM Comput. Commun. Rev. ACM 16, 386\u2013396 (1986)","journal-title":"ACM SIGCOMM Comput. Commun. Rev. ACM"},{"issue":"2","key":"336_CR19","doi-asserted-by":"crossref","first-page":"163","DOI":"10.1093\/comjnl\/6.2.163","volume":"6","author":"R Fletcher","year":"1963","unstructured":"Fletcher, R., Powell, M.J.: A rapidly convergent descent method for minimization. Comput. J. 6(2), 163\u2013168 (1963)","journal-title":"Comput. J."},{"key":"336_CR20","doi-asserted-by":"crossref","unstructured":"Garcia, M., Corbalan, J., Badia Maria, R., Labarta, J.: A dynamic load balancing approach with SMPSuperscalar and MPI. In: Keller, R., Kramer, D., Weiss, J.P. (eds.) Facing the Multicore-Challenge II, Springer Berlin Heidelberg, Stuttgart (2012)","DOI":"10.1007\/978-3-642-30397-5_2"},{"issue":"6","key":"336_CR21","doi-asserted-by":"crossref","first-page":"3089","DOI":"10.1016\/j.jcp.2007.10.027","volume":"227","author":"D George","year":"2008","unstructured":"George, D.: Augmented Riemann solvers for the shallow water equations over variable topography with steady states and inundation. J. Comput. Phys. 227(6), 3089\u20133113 (2008)","journal-title":"J. Comput. Phys."},{"key":"336_CR22","unstructured":"Gerndt, M., Hollmann, A., Meyer, M., Schreiber, M., Weidendorfer, J.: Invasive computing with iOMP. In: Specification and Design Languages (FDL), pp. 225\u2013231. IEEE, Vienna (2012)"},{"key":"336_CR23","doi-asserted-by":"crossref","unstructured":"Hesthaven, J.S., Warburton, T.: Nodal Discontinuous Galerkin Methods: Algorithms, Analysis, and Applications, pp. 97\u2013107. Springer Verlag, New York (2008)","DOI":"10.1007\/978-0-387-72067-8"},{"key":"336_CR24","unstructured":"Hsieh, W.C.Y.: Dynamic computation migration in distributed shared memory systems. PhD thesis, MIT (1995)"},{"key":"336_CR25","doi-asserted-by":"crossref","unstructured":"Keyes, D.E.: Four horizons for enhancing the performance of parallel simulations based on partial differential equations. In: Euro-Par 2000 Parallel Processing, pp. 1\u201317. Springer (2000)","DOI":"10.1007\/3-540-44520-X_1"},{"key":"336_CR26","doi-asserted-by":"crossref","unstructured":"Kobbe, S., Bauer, L., Lohmann, D., Schr\u00f6der-Preikschat, W., Henkel, J.: DistRM: Distributed resource management for on-chip many-core systems. In: Proceedings of the Seventh IEEE\/ACM\/IFIP International Conference on Hardware\/Software Codesign and System Synthesis, ACM, pp. 119\u2013128 (2011)","DOI":"10.1145\/2039370.2039392"},{"key":"336_CR27","doi-asserted-by":"crossref","unstructured":"Li, D., De Supinski, B., Schulz, M., Cameron, K., Nikolopoulos, D.: Hybrid MPI\/OpenMP power-aware computing. In: Parallel Distributed Processing (IPDPS), pp. 1\u201312 (2010)","DOI":"10.1109\/IPDPS.2010.5470463"},{"key":"336_CR28","doi-asserted-by":"crossref","unstructured":"Meister, O., Rahnema, K., Bader, M.: A software concept for cache-efficient simulation on dynamically adaptive structured triangular grids. In: PARCO, pp. 251\u2013260 (2011)","DOI":"10.3233\/978-1-61499-041-3-251"},{"key":"336_CR29","doi-asserted-by":"crossref","first-page":"35","DOI":"10.1145\/996893.996848","volume":"39","author":"MM Michael","year":"2004","unstructured":"Michael, M.M.: Scalable lock-free dynamic memory allocation. ACM SIGPLAN Not. ACM 39, 35\u201346 (2004)","journal-title":"ACM SIGPLAN Not. ACM"},{"key":"336_CR30","unstructured":"Neckel, T.: The PDE framework peano: an environment for efficient flow simulations. Dissertation, Institut f\u00fcr Informatik, Technische Universit\u00e4t M\u00fcnchen (2009)"},{"key":"336_CR31","doi-asserted-by":"crossref","unstructured":"Nogina, S., Unterweger, K., Weinzierl, T.: Autotuning of adaptive mesh refinement PDE solvers on shared memory architectures. In: PPAM 2011. Lecture Notes in Computer Science, vol. 7203, pp. 671\u2013680. Springer, Heidelberg (2012)","DOI":"10.1007\/978-3-642-31464-3_68"},{"key":"336_CR32","volume-title":"Intel Threading Building Blocks: Outfitting C++ for Multi-core Processor Parallelism","author":"J Reinders","year":"2010","unstructured":"Reinders, J.: Intel Threading Building Blocks: Outfitting C++ for Multi-core Processor Parallelism. O\u2019Reilly Media Inc, Sebastopol (2010)"},{"key":"336_CR33","doi-asserted-by":"crossref","unstructured":"Rosu, D., Schwan, K., Yalamanchili, S., Jha, R.: On adaptive resource allocation for complex real-time applications. In: Proceedings of the 18th IEEE Real-Time Systems Symposium, IEEE Computer Society, Washington, DC, USA, RTSS \u201997, p. 320 (1997). doi: 10.1109\/REAL.1997.641293","DOI":"10.1109\/REAL.1997.641293"},{"issue":"1","key":"336_CR34","doi-asserted-by":"crossref","first-page":"230","DOI":"10.1137\/0730011","volume":"30","author":"U R\u00fcde","year":"1993","unstructured":"R\u00fcde, U.: Fully adaptive multigrid methods. SIAM J. Numer. Anal. 30(1), 230\u2013248 (1993)","journal-title":"SIAM J. Numer. Anal."},{"key":"336_CR35","doi-asserted-by":"crossref","unstructured":"Rusanov, V.V.: Calculation of interaction of non-steady shock waves with obstacles. NRC, Division of Mechanical Engineering (1962)","DOI":"10.1016\/0041-5553(62)90062-9"},{"key":"336_CR36","doi-asserted-by":"crossref","DOI":"10.1007\/978-1-4612-0871-6","volume-title":"Space-Filling Curves","author":"H Sagan","year":"1994","unstructured":"Sagan, H.: Space-Filling Curves, vol. 18. Springer, New York (1994)"},{"key":"336_CR37","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"crossref","first-page":"547","DOI":"10.1007\/978-3-642-40047-6_56","volume-title":"Euro-Par 2013 Parallel Processing","author":"D Schmidl","year":"2013","unstructured":"Schmidl, D., Cramer, T., Wienke, S., Terboven, C., M\u00fcller, M.: Assessing the performance of openmp programs on the intel xeon phi. In: Wolf, F., Mohr, B., Mey, D. (eds.) Euro-Par 2013 Parallel Processing. Lecture Notes in Computer Science, vol. 8097, pp. 547\u2013558. Springer, Berlin (2013)"},{"key":"336_CR38","doi-asserted-by":"crossref","unstructured":"Schreiber, M., Bungartz, H.J., Bader, M.: Shared memory parallelization of fully-adaptive simulations using a dynamic tree-split and -join approach. In: IEEE International Conference on High Performance Computing (HiPC), IEEE Xplore, Puna, India (2012)","DOI":"10.1109\/HiPC.2012.6507479"},{"key":"336_CR39","doi-asserted-by":"crossref","unstructured":"Schreiber, M., Weinzierl, T., Bungartz, H.J.: Cluster optimization of parallel simulations with dynamically adaptive grids. In: EuroPar 2013, Aachen, Germany (2013a)","DOI":"10.1007\/978-3-642-40047-6_50"},{"key":"336_CR40","unstructured":"Schreiber, M., Weinzierl, T., Bungartz, H.J.: SFC-based communication metadata encoding for adaptive mesh. In: Proceedings of the International Conference on Parallel Computing (ParCo) (2013b)"},{"issue":"7","key":"336_CR41","doi-asserted-by":"crossref","first-page":"559","DOI":"10.5047\/eps.2011.06.028","volume":"63","author":"G Shao","year":"2011","unstructured":"Shao, G., Li, X., Ji, C., Maeda, T.: Focal mechanism and slip history of the 2011 Mw 9.1 off the Pacific coast of Tohoku Earthquake, constrained with teleseismic body and surface waves. Earth Planets Space 63(7), 559\u2013564 (2011)","journal-title":"Earth Planets Space"},{"key":"336_CR42","doi-asserted-by":"crossref","unstructured":"Teich, J., Henkel, J., Herkersdorf, A., Schmitt-Landsiedel, D., Schr\u00f6der-Preikschat, W., Snelting, G.: Invasive computing: an overview. In: Multiprocessor SoC, pp. 241\u2013268. Springer (2011)","DOI":"10.1007\/978-1-4419-6460-1_11"},{"key":"336_CR43","doi-asserted-by":"crossref","unstructured":"Tradowsky, C., Schreiber, M., Vesper, M., Domladovec, I., Braun, M., Bungartz, H.J., Becker, J.: Towards Dynamic Cache and Bandwidth Invasion, pp. 97\u2013107. Springer International Publishing (2014)","DOI":"10.1007\/978-3-319-05960-0_9"},{"key":"336_CR44","unstructured":"Vigh, C.A.: Parallel simulations of the shallow water equations on structured dynamically adaptive triangular grids. Dissertation, Institut f\u00fcr Informatik, Technische Universit\u00e4t M\u00fcnchen (2012)"},{"key":"336_CR45","doi-asserted-by":"crossref","unstructured":"Vuchener, C., Esnard, A.: Dynamic load-balancing with variable number of processors based on graph repartitioning. In: Proceedings of High Performance Computing (HiPC 2012), pp. 1\u20139 (2012)","DOI":"10.1109\/HiPC.2012.6507501"},{"key":"336_CR46","unstructured":"Weinzierl, T.: A framework for parallel PDE solvers on multiscale adaptive cartesian grids. Dissertation, Institut f\u00fcr Informatik, Technische Universit\u00e4t M\u00fcnchen, M\u00fcnchen (2009)"}],"container-title":["International Journal of Parallel Programming"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10766-014-0336-3.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10766-014-0336-3\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10766-014-0336-3","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,5]],"date-time":"2025-05-05T13:34:30Z","timestamp":1746452070000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10766-014-0336-3"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2014,10,26]]},"references-count":46,"journal-issue":{"issue":"6","published-print":{"date-parts":[[2015,12]]}},"alternative-id":["336"],"URL":"https:\/\/doi.org\/10.1007\/s10766-014-0336-3","relation":{},"ISSN":["0885-7458","1573-7640"],"issn-type":[{"value":"0885-7458","type":"print"},{"value":"1573-7640","type":"electronic"}],"subject":[],"published":{"date-parts":[[2014,10,26]]}}}