{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T05:04:16Z","timestamp":1755839056211,"version":"3.40.3"},"publisher-location":"Cham","reference-count":26,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783030631703"},{"type":"electronic","value":"9783030631710"}],"license":[{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,1,1]],"date-time":"2020-01-01T00:00:00Z","timestamp":1577836800000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020]]},"DOI":"10.1007\/978-3-030-63171-0_8","type":"book-chapter","created":{"date-parts":[[2020,11,16]],"date-time":"2020-11-16T00:04:47Z","timestamp":1605485087000},"page":"145-162","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["PDAWL: Profile-Based Iterative Dynamic Adaptive WorkLoad Balance on Heterogeneous Architectures"],"prefix":"10.1007","author":[{"given":"Tongsheng","family":"Geng","sequence":"first","affiliation":[]},{"given":"Marcos","family":"Amaris","sequence":"additional","affiliation":[]},{"given":"St\u00e9phane","family":"Zuckerman","sequence":"additional","affiliation":[]},{"given":"Alfredo","family":"Goldman","sequence":"additional","affiliation":[]},{"given":"Guang R.","family":"Gao","sequence":"additional","affiliation":[]},{"given":"Jean-Luc","family":"Gaudiot","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2020,11,16]]},"reference":[{"issue":"4","key":"8_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3155288","volume":"14","author":"J Arteaga","year":"2017","unstructured":"Arteaga, J., Zuckerman, S., Gao, G.R.: Generating fine-grain multithreaded applications using a multigrain approach. ACM Trans. Archit. Code Optim. 14(4), 1\u201347 (2017). https:\/\/doi.org\/10.1145\/3155288","journal-title":"ACM Trans. Archit. Code Optim."},{"doi-asserted-by":"publisher","unstructured":"Barnes, B.J., Rountree, B., Lowenthal, D.K., Reeves, J., de Supinski, B., Schulz, M.: A regression-based approach to scalability prediction. In: Proceedings of the 22Nd Annual International Conference on Supercomputing, pp. 368\u2013377. ICS 2008, ACM, New York, USA (2008). https:\/\/doi.org\/10.1145\/1375527.1375580","key":"8_CR2","DOI":"10.1145\/1375527.1375580"},{"issue":"6","key":"8_CR3","doi-asserted-by":"publisher","first-page":"784","DOI":"10.1109\/TC.2017.2783932","volume":"67","author":"Q Chen","year":"2018","unstructured":"Chen, Q., Guo, M.: Contention and locality-aware work-stealing for iterative applications in multi-socket computers. IEEE Trans. Comput. 67(6), 784\u2013798 (2018). https:\/\/doi.org\/10.1109\/TC.2017.2783932","journal-title":"IEEE Trans. Comput."},{"key":"8_CR4","doi-asserted-by":"publisher","first-page":"219","DOI":"10.1016\/j.jpdc.2018.04.017","volume":"119","author":"E Chow","year":"2018","unstructured":"Chow, E., Anzt, H., Scott, J., Dongarra, J.: Using jacobi iterations and blocking for solving sparse triangular systems in incomplete factorization preconditioning. J. Parallel Distrib. Comput. 119, 219\u2013230 (2018)","journal-title":"J. Parallel Distrib. Comput."},{"doi-asserted-by":"publisher","unstructured":"Danalis, A., et al.: The scalable heterogeneous computing (SHOC) benchmark suite. In: Proceedings of the 3rd Workshop on General-Purpose Computation on Graphics Processing Units, pp. 63\u201374. GPGPU-3, ACM, New York, USA (2010). https:\/\/doi.org\/10.1145\/1735688.1735702, http:\/\/doi.acm.org\/10.1145\/1735688.1735702","key":"8_CR5","DOI":"10.1145\/1735688.1735702"},{"doi-asserted-by":"publisher","unstructured":"Davis, T.A., Hu, Y.: The university of florida sparse matrix collection. ACM Trans. Math. Softw. 38(1), 1:1\u20131:25 December 2011. https:\/\/doi.org\/10.1145\/2049662.2049663, http:\/\/doi.acm.org\/10.1145\/2049662.2049663","key":"8_CR6","DOI":"10.1145\/2049662.2049663"},{"doi-asserted-by":"publisher","unstructured":"Garc\u00eda, V., Gomez-Luna, J., Grass, T., Rico, A., Ayguade, E., Pena, A.J.: Evaluating the effect of last-level cache sharing on integrated GPU-CPU systems with heterogeneous applications. In: 2016 IEEE International Symposium on Workload Characterization (IISWC), pp. 1\u201310 September 2016. https:\/\/doi.org\/10.1109\/IISWC.2016.7581277","key":"8_CR7","DOI":"10.1109\/IISWC.2016.7581277"},{"key":"8_CR8","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1007\/978-3-319-52709-3_16","volume-title":"Languages and Compilers for Parallel Computing","author":"T Geng","year":"2017","unstructured":"Geng, T., et al.: The importance of efficient fine-grain synchronization for many-core systems. In: Ding, C., Criswell, J., Wu, P. (eds.) LCPC 2016. LNCS, vol. 10136, pp. 203\u2013217. Springer, Cham (2017). https:\/\/doi.org\/10.1007\/978-3-319-52709-3_16"},{"doi-asserted-by":"publisher","unstructured":"Lee, V.W., et al.: Debunking the 100x gpu vs. cpu myth: An evaluation of throughput computing on CPU and GPU. In: Proceedings of the 37th Annual International Symposium on Computer Architecture, pp. 451\u2013460. ISCA 2010, ACM, New York, USA (2010). https:\/\/doi.org\/10.1145\/1815961.1816021, http:\/\/doi.acm.org\/10.1145\/1815961.1816021","key":"8_CR9","DOI":"10.1145\/1815961.1816021"},{"unstructured":"Levon, J., Elie, P.: Oprofile: A system profiler for linux (2004)","key":"8_CR10"},{"unstructured":"List, T.S.: November 2017. http:\/\/www.top500.org","key":"8_CR11"},{"doi-asserted-by":"publisher","unstructured":"Luk, C.K., Hong, S., Kim, H.: Qilin: exploiting parallelism on heterogeneous multiprocessors with adaptive mapping. In: Proceedings of the 42Nd Annual IEEE\/ACM International Symposium on Microarchitecture, pp. 45\u201355. MICRO 42, ACM, New York, USA (2009). https:\/\/doi.org\/10.1145\/1669112.1669121, http:\/\/doi.acm.org\/10.1145\/1669112.1669121","key":"8_CR12","DOI":"10.1145\/1669112.1669121"},{"issue":"4","key":"8_CR13","first-page":"59","volume":"9","author":"T Lutz","year":"2013","unstructured":"Lutz, T., Fensch, C., Cole, M.: Partans: an autotuning framework for stencil computation on multi-GPU systems. ACM Trans. Arch. Code Optim. (TACO) 9(4), 59 (2013)","journal-title":"ACM Trans. Arch. Code Optim. (TACO)"},{"doi-asserted-by":"crossref","unstructured":"Margiolas, C., O\u2019Boyle, M.F.P.: Portable and transparent software managed scheduling on accelerators for fair resource sharing. In: 2016 IEEE\/ACM International Symposium on Code Generation and Optimization (CGO), pp. 82\u201393, March 2016","key":"8_CR14","DOI":"10.1145\/2854038.2854040"},{"doi-asserted-by":"publisher","unstructured":"O\u2019Boyle, M.F.P., Wang, Z., Grewe, D.: Portable mapping of data parallel programs to opencl for heterogeneous systems. In: Proceedings of the 2013 IEEE\/ACM International Symposium on Code Generation and Optimization (CGO). pp. 1\u201310. CGO 2013, IEEE Computer Society, Washington, DC, USA (2013). https:\/\/doi.org\/10.1109\/CGO.2013.6494993, http:\/\/dx.doi.org\/10.1109\/CGO.2013.6494993","key":"8_CR15","DOI":"10.1109\/CGO.2013.6494993"},{"doi-asserted-by":"publisher","unstructured":"Sant\u2019Ana, L., Cordeiro, D., Camargo, R.: PLB-HeC: a profile-based load-balancing algorithm for heterogeneous CPU-GPU clusters. In: 2015 IEEE International Conference on Cluster Computing, pp. 96\u2013105, September 2015. https:\/\/doi.org\/10.1109\/CLUSTER.2015.24","key":"8_CR16","DOI":"10.1109\/CLUSTER.2015.24"},{"key":"8_CR17","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"197","DOI":"10.1007\/978-3-030-29400-7_15","volume-title":"Euro-Par 2019: Parallel Processing","author":"L San\u2019Ana","year":"2019","unstructured":"San\u2019Ana, L., Cordeiro, D., de Camargo, R.Y.: PLB-HAC: dynamic load-balancing for heterogeneous accelerator clusters. In: Yahyapour, R. (ed.) Euro-Par 2019. LNCS, vol. 11725, pp. 197\u2013209. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-29400-7_15"},{"key":"8_CR18","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"633","DOI":"10.1007\/978-3-642-40047-6_63","volume-title":"Euro-Par 2013 Parallel Processing","author":"J Suettlerlein","year":"2013","unstructured":"Suettlerlein, J., Zuckerman, S., Gao, G.R.: An implementation of the codelet model. In: Wolf, F., Mohr, B., an Mey, D. (eds.) Euro-Par 2013. LNCS, vol. 8097, pp. 633\u2013644. Springer, Heidelberg (2013). https:\/\/doi.org\/10.1007\/978-3-642-40047-6_63"},{"doi-asserted-by":"publisher","unstructured":"Tribbey, W.: Modern database systems. In: Kim, W. (ed.) Modern Database Systems, chap. Numerical Recipes: The Art of Scientific Computing (3rd Edition) is Written by William H. Press, Saul A. Teukolsky, William T. Vetterling, and Brian P. Flannery, and Published by Cambridge University Press, 2007, Hardback, pp. 30\u201331, ISBN 978-0-521-88068-8, 1235 Pp. ACM Press\/Addison-Wesley Publishing Co., New York, USA (1995). https:\/\/doi.org\/10.1145\/1874391.187410, http:\/\/dx.doi.org\/10.1145\/1874391.187410","key":"8_CR19","DOI":"10.1145\/1874391.187410"},{"doi-asserted-by":"publisher","unstructured":"Van Craeynest, K., Jaleel, A., Eeckhout, L., Narvaez, P., Emer, J.: Scheduling heterogeneous multi-cores through performance impact estimation (pie). SIGARCH Comput. Archit. News 40(3), 213\u2013224 (2012). https:\/\/doi.org\/10.1145\/2366231.2337184, http:\/\/doi.acm.org\/10.1145\/2366231.2337184","key":"8_CR20","DOI":"10.1145\/2366231.2337184"},{"doi-asserted-by":"publisher","unstructured":"Wang, Z., Tournavitis, G., Franke, B., O\u2019boyle, M.F.P.: Integrating profile-driven parallelism detection and machine-learning-based mapping. ACM Trans. Archit. Code Optim. 11(1), 1\u201326 (2014). https:\/\/doi.org\/10.1145\/2579561, http:\/\/doi.acm.org\/10.1145\/2579561","key":"8_CR21","DOI":"10.1145\/2579561"},{"doi-asserted-by":"publisher","unstructured":"Wen, Y., O\u2019Boyle, M.F.: Merge or separate?: multi-job scheduling for opencl kernels on CPU\/GPU platforms. In: Proceedings of the General Purpose GPUs, pp. 22\u201331. GPGPU-10, ACM, New York, USA (2017). https:\/\/doi.org\/10.1145\/3038228.3038235, http:\/\/doi.acm.org\/10.1145\/3038228.3038235","key":"8_CR22","DOI":"10.1145\/3038228.3038235"},{"doi-asserted-by":"publisher","unstructured":"Yang, C., et al.: Adaptive optimization for petascale heterogeneous CPU\/GPU computing. In: IEEE International Conference on Cluster Computing, pp. 19\u201328, September 2010). https:\/\/doi.org\/10.1109\/CLUSTER.2010.12","key":"8_CR23","DOI":"10.1109\/CLUSTER.2010.12"},{"doi-asserted-by":"publisher","unstructured":"Zhang, F., Wu, B., Zhai, J., He, B., Chen, W.: Finepar: irregularity-aware fine-grained workload partitioning on integrated architectures. In: 2017 IEEE\/ACM International Symposium on Code Generation and Optimization (CGO), pp. 27\u201338, Febuary 2017. https:\/\/doi.org\/10.1109\/CGO.2017.7863726","key":"8_CR24","DOI":"10.1109\/CGO.2017.7863726"},{"issue":"3","key":"8_CR25","doi-asserted-by":"publisher","first-page":"905","DOI":"10.1109\/TPDS.2016.2586074","volume":"28","author":"F Zhang","year":"2017","unstructured":"Zhang, F., Zhai, J., He, B., Zhang, S., Chen, W.: Understanding co-running behaviors on integrated CPU\/GPU architectures. IEEE TPDS 28(3), 905\u2013918 (2017). https:\/\/doi.org\/10.1109\/TPDS.2016.2586074","journal-title":"IEEE TPDS"},{"doi-asserted-by":"crossref","unstructured":"Zuckerman, S., Suetterlein, J., Knauerhase, R., Gao, G.R.: Using a \u201ccodelet\" program execution model for exascale machines: position paper. In: Proceedings of the 1st International Workshop on Adaptive Self-Tuning Computing Systems for the Exaflop Era. EXADAPT 2011, ACM, New York, USA (2011)","key":"8_CR26","DOI":"10.1145\/2000417.2000424"}],"container-title":["Lecture Notes in Computer Science","Job Scheduling Strategies for Parallel Processing"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-63171-0_8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,4,24]],"date-time":"2021-04-24T12:12:35Z","timestamp":1619266355000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-63171-0_8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020]]},"ISBN":["9783030631703","9783030631710"],"references-count":26,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-63171-0_8","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2020]]},"assertion":[{"value":"16 November 2020","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"JSSPP","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Workshop on Job Scheduling Strategies for Parallel Processing","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"New Orleans, LA","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"USA","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2020","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22 May 2020","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22 May 2020","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"jsspp2020","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/jsspp.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Easychair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"8","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"6","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"75% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.8","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"The conference was held virtually due to the COVID-19 pandemic.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}