{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,29]],"date-time":"2025-11-29T07:55:19Z","timestamp":1764402919485,"version":"3.37.3"},"reference-count":53,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"1","license":[{"start":{"date-parts":[[2021,3,1]],"date-time":"2021-03-01T00:00:00Z","timestamp":1614556800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,3,1]],"date-time":"2021-03-01T00:00:00Z","timestamp":1614556800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,3,1]],"date-time":"2021-03-01T00:00:00Z","timestamp":1614556800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100000038","name":"Natural Sciences and Engineering Research Council of Canada","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100000038","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/100000183","name":"Army Research office","doi-asserted-by":"publisher","id":[{"id":"10.13039\/100000183","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Big Data"],"published-print":{"date-parts":[[2021,3,1]]},"DOI":"10.1109\/tbdata.2019.2908188","type":"journal-article","created":{"date-parts":[[2019,3,29]],"date-time":"2019-03-29T18:48:13Z","timestamp":1553885293000},"page":"115-127","source":"Crossref","is-referenced-by-count":14,"title":["Deadline-Aware Cost Optimization for Spark"],"prefix":"10.1109","volume":"7","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-6578-0114","authenticated-orcid":false,"given":"Subhajit","family":"Sidhanta","sequence":"first","affiliation":[]},{"given":"Wojciech","family":"Golab","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-0839-1133","authenticated-orcid":false,"given":"Supratik","family":"Mukhopadhyay","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"year":"2014","key":"ref39","article-title":"Apache Software Foundation, Apache hadoop nextgen MapReduce (yarn)"},{"article-title":"9 super-cool uses for supercomputers","year":"2015","author":"pappas","key":"ref38"},{"article-title":"SNAP datasets: Stanford large network dataset collection","year":"2014","author":"leskovec","key":"ref33"},{"year":"2003","key":"ref32"},{"article-title":"Spark programming guide","year":"2017","author":"foundation","key":"ref31"},{"key":"ref30","article-title":"Proving linearizability via branching bisimulation","author":"yang","year":"2016","journal-title":"CoRR"},{"year":"2015","key":"ref37","article-title":"Category archives: Use case"},{"article-title":"Powered by spark","year":"2015","author":"foundation","key":"ref36"},{"year":"2017","key":"ref35","article-title":"Deep learning pipelines for apache spark"},{"year":"2008","key":"ref34"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1007\/s10009-012-0244-z"},{"article-title":"Optex job claassifier and model generator","year":"2018","author":"sidhanta","key":"ref27"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-31980-1_42"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/2038916.2038934"},{"journal-title":"Amazon Elastic Compute Cloud (Amazon EC2)","year":"2008","key":"ref1"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.2168\/LMCS-11(4:16)2015"},{"key":"ref22","first-page":"309","article-title":"Bisimulations on data graphs","author":"abriola","year":"2016","journal-title":"Proc 15th Int Conf Principles Knowl Representation Reasoning"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1016\/0022-0000(87)90025-0"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-23702-7_22"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-45022-X_29"},{"article-title":"Statlib data and story library (DASL)","year":"1996","author":"chase","key":"ref26"},{"journal-title":"Numerical Analysis and Scientific Computation","year":"2004","author":"leader","key":"ref25"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1145\/1807128.1807136"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/TSC.2011.7"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2011.05.027"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/ICAC.2005.27"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/2783258.2789993"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/s41060-016-0027-9"},{"key":"ref40","first-page":"293","article-title":"Making sense of performance in data analytics frameworks","author":"ousterhout","year":"2015","journal-title":"Proc 12th USENIX Conf Netw Syst Des Implementation"},{"article-title":"How to track shopping cart abandonment in Google analytics","year":"2017","author":"centenaro","key":"ref12"},{"article-title":"Netflix at spark+ai summit 2018","year":"2018","author":"siddiqi","key":"ref13"},{"year":"2018","key":"ref14","article-title":"Tutorial: Introduction to apache spark"},{"article-title":"OptEx: Deadline-aware cost optimization for spark","year":"2018","author":"sidhanta","key":"ref15"},{"article-title":"Apache spark libraries","year":"2015","author":"foundation","key":"ref16"},{"key":"ref17","first-page":"481","article-title":"An algebraic definition of simulation between programs","author":"milner","year":"1971","journal-title":"Proc 2nd Int Joint Conf Artif Intell"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/BFb0017309"},{"journal-title":"Communicating and Mobile Systems The &Pgr -calculus","year":"1999","author":"milner","key":"ref19"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/CCGrid.2014.101"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1145\/1998582.1998637"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/UCC.2013.40"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CloudCom.2010.97"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CCGrid.2016.10"},{"key":"ref7","first-page":"4","article-title":"Towards a model for cloud computing cost estimation with reserved instances","author":"singer","year":"2010","journal-title":"Proc Int Conf Cloud Comput"},{"key":"ref49","first-page":"337","article-title":"Energy-aware server provisioning and load dispatching for connection-intensive internet services","author":"chen","year":"2008","journal-title":"Proc 5th USENIX Symp Netw Syst Des Implementation"},{"key":"ref9","first-page":"2","article-title":"Resilient distributed datasets: A fault-tolerant abstraction for in-memory cluster computing","author":"zaharia","year":"2012","journal-title":"Proc 9th USENIX Conf Netw Syst Des Implementation"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-63390-9_15"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-33078-0_30"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/TCC.2017.2702661"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1145\/2517349.2522739"},{"key":"ref42","first-page":"219","article-title":"DeepDive: Transparently identifying and managing performance interference in virtualized environments","author":"novakovi?","year":"2013","journal-title":"Proc USENIX Conf Annu Tech Conf"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/TSC.2012.2"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ICCAD.2017.8203853"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/IISWC.2012.6402895"}],"container-title":["IEEE Transactions on Big Data"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/6687317\/9366322\/08676267.pdf?arnumber=8676267","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T14:54:06Z","timestamp":1652194446000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/8676267\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,3,1]]},"references-count":53,"journal-issue":{"issue":"1"},"URL":"https:\/\/doi.org\/10.1109\/tbdata.2019.2908188","relation":{},"ISSN":["2332-7790","2372-2096"],"issn-type":[{"type":"electronic","value":"2332-7790"},{"type":"electronic","value":"2372-2096"}],"subject":[],"published":{"date-parts":[[2021,3,1]]}}}