{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,16]],"date-time":"2025-10-16T10:01:39Z","timestamp":1760608899834,"version":"3.41.0"},"reference-count":109,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2015,10,29]],"date-time":"2015-10-29T00:00:00Z","timestamp":1446076800000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["51208538"],"award-info":[{"award-number":["51208538"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Parallel Prog"],"published-print":{"date-parts":[[2016,8]]},"DOI":"10.1007\/s10766-015-0395-0","type":"journal-article","created":{"date-parts":[[2015,10,29]],"date-time":"2015-10-29T03:49:58Z","timestamp":1446090598000},"page":"832-866","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":50,"title":["MapReduce Parallel Programming Model: A State-of-the-Art Survey"],"prefix":"10.1007","volume":"44","author":[{"given":"Ren","family":"Li","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Haibo","family":"Hu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Heng","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yunsong","family":"Wu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jianxi","family":"Yang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2015,10,29]]},"reference":[{"issue":"2","key":"395_CR1","doi-asserted-by":"crossref","first-page":"281","DOI":"10.1007\/s10723-013-9255-6","volume":"11","author":"J Shamsi","year":"2013","unstructured":"Shamsi, J., Khojaye, M.A., Qasmi, M.A.: Data-intensive cloud computing: requirement, expectations, challenges and solutions. J. Grid Comput. 11(2), 281\u2013310 (2013)","journal-title":"J. Grid Comput."},{"issue":"1","key":"395_CR2","first-page":"146","volume":"50","author":"X Meng","year":"2013","unstructured":"Meng, X., Ci, X.: Big data management: concepts, techniques and challenges. J. Comput. Res. Dev. 50(1), 146\u2013169 (2013)","journal-title":"J. Comput. Res. Dev."},{"issue":"10","key":"395_CR3","doi-asserted-by":"crossref","first-page":"1741","DOI":"10.3724\/SP.J.1016.2011.01741","volume":"34","author":"S Wang","year":"2013","unstructured":"Wang, S., Wang, H., Qin, X., Zhou, X.: Architecting big data: challenges, studies and forecasts. Chin. J. Comput. 34(10), 1741\u20131752 (2013)","journal-title":"Chin. J. Comput."},{"key":"395_CR4","unstructured":"Mell, P., Grance, T.: Definition of Cloud Computing. Technical report, National Institute of Standards and Technology (NIST) (2009)"},{"issue":"3","key":"395_CR5","doi-asserted-by":"crossref","first-page":"311","DOI":"10.1109\/SURV.2011.032211.00087","volume":"13","author":"S Sakr","year":"2011","unstructured":"Sakr, S., Liu, A., Batista, D.M., Alomari, M.: A survey of large scale data management approaches in cloud environments. IEEE Commun. Surv. Tutor. 13(3), 311\u2013336 (2011)","journal-title":"IEEE Commun. Surv. Tutor."},{"issue":"1","key":"395_CR6","doi-asserted-by":"crossref","first-page":"107","DOI":"10.1145\/1327452.1327492","volume":"51","author":"J Dean","year":"2008","unstructured":"Dean, J., Ghemawat, S.: MapReduce: simplified data processing on large clusters. Commun. ACM 51(1), 107\u2013133 (2008)","journal-title":"Commun. ACM"},{"key":"395_CR7","doi-asserted-by":"crossref","unstructured":"Ghemawat, S., Gobioff, H., Leung, S.-T.: The Google file system. In: Proceedings of 19th ACM Symposium on Operating Systems Principles, pp. 29\u201343. ACM (2003)","DOI":"10.1145\/945445.945450"},{"issue":"5","key":"395_CR8","doi-asserted-by":"crossref","first-page":"82","DOI":"10.1109\/MIS.2008.94","volume":"23","author":"P Mika","year":"2008","unstructured":"Mika, P., Tummarello, G.: Web semantics in the clouds. IEEE Intell. Syst. 23(5), 82\u201387 (2008)","journal-title":"IEEE Intell. Syst."},{"key":"395_CR9","unstructured":"Apache Hadoop. http:\/\/hadoop.apache.org\/ . Accessed Oct. 2014"},{"key":"395_CR10","doi-asserted-by":"crossref","unstructured":"Olston, C., Reed, B., Srivastava, U., Kumar, R., Tomkins, A.: PigLatin: a not-so-foreign language for data processing. In: Proceedings of ACM SIGMOD International Conference of Management of Data (2008)","DOI":"10.1145\/1376616.1376726"},{"key":"395_CR11","unstructured":"Mahou. http:\/\/mahout.apache.org\/ . Accessed Oct 2014"},{"key":"395_CR12","doi-asserted-by":"crossref","first-page":"59","DOI":"10.1016\/j.websem.2011.05.004","volume":"10","author":"J Urbani","year":"2012","unstructured":"Urbani, J., Kotoulas, S., Maassen, J., Harmelen, F.V., Bal, H.: WebPIE: a web-scale parallel inference engine using mapreduce. J. Web Semant. 10, 59\u201375 (2012)","journal-title":"J. Web Semant."},{"issue":"5","key":"395_CR13","doi-asserted-by":"crossref","first-page":"34","DOI":"10.1038\/scientificamerican0501-34","volume":"284","author":"T Berners-Lee","year":"2001","unstructured":"Berners-Lee, T., Hendler, J., Lassila, O.: The Semantic Web. Sci. Am. 284(5), 34\u201343 (2001)","journal-title":"Sci. Am."},{"issue":"10","key":"395_CR14","doi-asserted-by":"crossref","first-page":"1785","DOI":"10.3724\/SP.J.1016.2011.01785","volume":"34","author":"L Ding","year":"2011","unstructured":"Ding, L., Xin, J., Wang, G., Huang, S.: Efficient skyline query processing of massive data based on MapReduce. Chin. J. Comput. 34(10), 1785\u20131796 (2011)","journal-title":"Chin. J. Comput."},{"issue":"3","key":"395_CR15","doi-asserted-by":"crossref","first-page":"355","DOI":"10.1007\/s00778-013-0319-9","volume":"23","author":"C Doulkeridis","year":"2014","unstructured":"Doulkeridis, C., N\u00f8rv\u00e5g, K.: A survey of large-scale analytical query processing in MapReduce. VLDB J. 23(3), 355\u2013380 (2014)","journal-title":"VLDB J."},{"issue":"3","key":"395_CR16","first-page":"31","volume":"46","author":"F Li","year":"2014","unstructured":"Li, F., Ooi, B.C., \u00d6zsu, M.T., Wu, S.: Distributed data management using MapReduce. ACM Comput. Surv. 46(3), 31 (2014)","journal-title":"ACM Comput. Surv."},{"issue":"4","key":"395_CR17","first-page":"11","volume":"40","author":"KH Lee","year":"2011","unstructured":"Lee, K.H., Lee, Y.J., Choi, H., Chung, Y.D., Moon, B.: Parallel data processing with MapReduce: a survey. ACM SIGMOD Rec. 40(4), 11\u201320 (2011)","journal-title":"ACM SIGMOD Rec."},{"issue":"1","key":"395_CR18","doi-asserted-by":"crossref","first-page":"72","DOI":"10.1145\/1629175.1629198","volume":"53","author":"J Dean","year":"2010","unstructured":"Dean, J., Ghemawat, S.: MapReduce: a flexible data processing tool. Commun. ACM 53(1), 72\u201377 (2010)","journal-title":"Commun. ACM"},{"key":"395_CR19","unstructured":"Van Biema, M.: Parallelism in Lisp. In: IJCAI87, pp. 56\u201361 (1987)"},{"key":"395_CR20","unstructured":"QT Concurrent. http:\/\/doc.qt.io\/qt-5\/qtconcurrent-index.html . Accessed Oct 2015"},{"key":"395_CR21","doi-asserted-by":"crossref","unstructured":"Ranger, C., Raghuraman, R., Penmetsa, A., Bradski, G., Kozyrakis, C.: Evaluating MapReduce for multi-core and multiprocessor systems. In: Proceedings of IEEE 13th International Symposium on High Performance Computer Architecture, pp. 13\u201324 (2007)","DOI":"10.1109\/HPCA.2007.346181"},{"key":"395_CR22","doi-asserted-by":"crossref","unstructured":"Talbot, J., Yoo, R.M., Kozyrakis, C.: Phoenix++: modular mapreduce for shared-memory systems. In: Proceedings of 2nd International Workshop on MapReduce and Its Applications, pp. 9\u201316 (2011)","DOI":"10.1145\/1996092.1996095"},{"key":"395_CR23","unstructured":"Disco massive data\u2014minimal code. http:\/\/discoproject.org\/ . Accessed Oct 2014"},{"key":"395_CR24","unstructured":"Geni, Skynet A Ruby MapReduce Framework. http:\/\/skynet.rubyforge.org\/ . Accessed Oct 2014"},{"key":"395_CR25","unstructured":"GridGain. http:\/\/www.gridgain.com\/ . Accessed Oct 2014"},{"key":"395_CR26","doi-asserted-by":"crossref","unstructured":"Ekanayake, J., Li, H., Zhang, B., Gunarathne, T., Bae, S.-H., Qiu, J., Fox, G.: Twister: a runtime for iterative MapReduce. In: Proceedings of First International Workshop on MapReduce and Its Applications of ACM, pp. 810\u2013818. ACM (2010)","DOI":"10.1145\/1851476.1851593"},{"key":"395_CR27","doi-asserted-by":"crossref","unstructured":"Dou, A.J., Kalogeraki, V., Gunopulos, D., Mielikainen, T., Tuulos, V.: Misco: a MapReduce Framework for mobile systems. In: Proceedings of 3rd International Conference on Pervasive Technologies Related to Assistive Environment (2010)","DOI":"10.1145\/1839294.1839332"},{"key":"395_CR28","unstructured":"DeWitt, D., Stonebraker, M.: MapReduce: a major step backwards. The Database Column 1 (2008)"},{"key":"395_CR29","doi-asserted-by":"crossref","unstructured":"Sun, X., He, C., Lu, Y.: ESAMR: an enhanced self-adaptive MapReduce scheduling algorithm. In: Proceedings of the 2012 IEEE 18th International Conference on Parallel and Distributed Systems, pp. 148\u2013155 (2012)","DOI":"10.1109\/ICPADS.2012.30"},{"issue":"9","key":"395_CR30","doi-asserted-by":"crossref","first-page":"1312","DOI":"10.1109\/TKDE.2011.103","volume":"23","author":"MF Husain","year":"2011","unstructured":"Husain, M.F., McGlothlin, J., Masud, M.M., Khan, L.R., Thuraisingham, B.: Heuristics-based query processing for large RDF graphs using cloud computing. IEEE Trans. Knowl. Data Eng. 23(9), 1312\u20131327 (2011)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"395_CR31","doi-asserted-by":"crossref","unstructured":"Sandholm, T., Lai, K.: MapReduce optimization using regulated dynamic prioritization. In: Proceedings of the 11th International Joint Conference on Measurement and Modeling of Computer Systems, pp. 299\u2013310 (2009)","DOI":"10.1145\/1555349.1555384"},{"key":"395_CR32","doi-asserted-by":"crossref","unstructured":"Seo, S., Jang, I., Woo, K., Kim, I., Kim, J.-S., Maeng, S.: HPMR: prefetching and pre-shuffling in shared MapReduce computation environment. In: Proceedings of 2009 IEEE International Conference on Cluster Computing and Workshops (2009)","DOI":"10.1109\/CLUSTR.2009.5289171"},{"key":"395_CR33","doi-asserted-by":"crossref","unstructured":"Polo, J., Carrera, D., Becerra, Y., Torres, J., Ayguade, E., Steinder, M., Whalley, I.: Performance-driven task co-scheduling for MapReduce environments. In: Proceedings of 12th IEEE\/IFIP Network Operations and Management Symposium, pp. 373\u2013380 (2010)","DOI":"10.1109\/NOMS.2010.5488494"},{"key":"395_CR34","doi-asserted-by":"crossref","unstructured":"Polo, J., Carrera, D., Becerra, Y., Beltran, V., Torres, J., Ayguade, E.: Performance management of accelerated MapReduce workloads in heterogeneous clusters. In: Proceedings of 39th International Conference on Parallel Processing, pp. 653\u2013662 (2010)","DOI":"10.1109\/ICPP.2010.73"},{"key":"395_CR35","doi-asserted-by":"crossref","unstructured":"Zaharia, M., Borthakur, D., Sarma, J.S., Elmeleegy, K., Shenker, S., Stoica, I.: Delay scheduling: a simple technique for achieving locality and fairness in cluster scheduling. In: EuroSyst, pp. 265\u2013278 (2010)","DOI":"10.1145\/1755913.1755940"},{"key":"395_CR36","unstructured":"Yao, Y., Tai, J., Sheng, B., Mi, N.: Scheduling heterogeneous MapReduce jobs for efficiency improvement in enterprise clusters. In: Proceedings of 2013 IFIP\/IEEE International Symposium on Integrated Network Management, pp. 872\u2013875 (2013)"},{"key":"395_CR37","unstructured":"Zaharia, M., Konwinski, A., Joseph, A. D., Katz, R., Stoica, I.: Improving MapReduce performance in heterogeneous environments. In: Proceedings of 8th USENIX Symposium on Operating System Design and Implementation, pp. 29\u201342 (2008)"},{"key":"395_CR38","doi-asserted-by":"crossref","unstructured":"Chen, Q., Zhang, D., Guo, M., Deng, Q., Guo, S.: SAMR: A self-adaptive MapReduce scheduling algorithm in heterogeneous environment. In: Proceedings of 10th IEEE International Conference on Computer and Information Technology, CIT-2010, 7th IEEE International Conference on Embedded Software and Systems, ICESS-2010, 10th IEEE International Conference on Scalable Computing and Communications, pp. 2736\u20132743 (2010)","DOI":"10.1109\/CIT.2010.458"},{"issue":"3","key":"395_CR39","doi-asserted-by":"crossref","first-page":"1038","DOI":"10.1007\/s11227-011-0682-5","volume":"64","author":"Q Chen","year":"2013","unstructured":"Chen, Q., Guo, M.Y., Deng, Q.N., Zheng, L., Guo, S., Shen, Y.: HAT: history-based auto-tuning MapReduce in heterogeneous environments. J. Supercomput. 64(3), 1038\u20131054 (2013)","journal-title":"J. Supercomput."},{"key":"395_CR40","doi-asserted-by":"crossref","unstructured":"Zhang, X., Feng, Y., Feng, S., Fan, J., Ming, Z.: An effective data locality aware task scheduling method for MapReduce framework in heterogeneous environments. In: Proceedings of 2011 International Conference on Cloud and Service Computing, pp. 235\u2013242 (2011)","DOI":"10.1109\/CSC.2011.6138527"},{"key":"395_CR41","doi-asserted-by":"crossref","unstructured":"Ahmad, F., Chakradhar, S.T., Raghunathan, A., Vijaykumar, T.N.: Tarazu: optimizing MapReduce on heterogeneous clusters. In: Proceedings of 17th International Conference on Architectural Support for Programming Languages and Operating Systems, pp. 61\u201374 (2011)","DOI":"10.1145\/2150976.2150984"},{"issue":"5","key":"395_CR42","first-page":"1096","volume":"8","author":"Y Yang","year":"2013","unstructured":"Yang, Y., Shi, B., Jiang, B., Xiang, L.: Data-replicas scheduler for heterogeneous MapReduce cluster. J. Netw. 8(5), 1096\u20131103 (2013)","journal-title":"J. Netw."},{"issue":"1","key":"395_CR43","doi-asserted-by":"crossref","first-page":"158","DOI":"10.1109\/TPDS.2012.88","volume":"24","author":"S Sehrish","year":"2013","unstructured":"Sehrish, S., Mackey, G., Shang, P.J., Wang, J., Bent, J.: Supporting HPC analytics applications with access patterns using data restructuring and data-centric scheduling techniques in MapReduce. IEEE Trans. Parallel Distrib. Syst. 24(1), 158\u2013169 (2013)","journal-title":"IEEE Trans. Parallel Distrib. Syst."},{"key":"395_CR44","unstructured":"Peng, D., Dabek, F., Inc, G.: Large-scale incremental processing using distributed transactions and notifications. In: Usenix Symposium on Operating Systems Design & Implementation, pp. 4\u20136 (2010)"},{"key":"395_CR45","doi-asserted-by":"crossref","unstructured":"Bu, X., Rao, J., Xu, C.: Interference and locality-aware task scheduling for MapReduce applications in virtual clusters. In: Proceedings of the 22nd ACM International Symposium on High-Performance Parallel and Distributed Computing, pp. 227\u2013238 (2013)","DOI":"10.1145\/2493123.2462904"},{"key":"395_CR46","doi-asserted-by":"crossref","unstructured":"Yang, H.-C., Dasdan, A., Hsiao, R.-L., Parker, D.S.: Map-Reduce-Merge: simplified relational data processing on large clusters. In: Proceedings of ACM SIGMOD International Conference on Management of Data, pp. 1029\u20131040 (2007)","DOI":"10.1145\/1247480.1247602"},{"issue":"9","key":"395_CR47","doi-asserted-by":"crossref","first-page":"1299","DOI":"10.1109\/TKDE.2010.248","volume":"23","author":"D Jiang","year":"2011","unstructured":"Jiang, D., Tung, A.K.H., Chen, G.: Map\u2013Join\u2013Reduce: toward scalable and efficient data analysis on large clusters. IEEE Trans. Knowl. Data Eng. 23(9), 1299\u20131311 (2011)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"395_CR48","doi-asserted-by":"crossref","unstructured":"Ferrera, P., de Prado, I., Palacios, E., Fernandez-Marquez, J.L., Serugendo, G.D.: Tuple MapReduce: beyond classic MapReduce. In: Proceedings of 12th IEEE International Conference on Data Mining, pp. 260\u2013269 (2012)","DOI":"10.1109\/ICDM.2012.141"},{"key":"395_CR49","doi-asserted-by":"crossref","unstructured":"Vu, T.-T., Huet, F.: A lightweight continuous jobs mechanism for MapReduce frameworks. In: Proceedings of 13th IEEE\/ACM International Symposium on Cluster, Cloud, and Grid Computing, pp. 269\u2013276 (2013)","DOI":"10.1109\/CCGrid.2013.36"},{"issue":"2","key":"395_CR50","doi-asserted-by":"crossref","first-page":"185","DOI":"10.1002\/int.21563","volume":"28","author":"W Premchaiswadi","year":"2013","unstructured":"Premchaiswadi, W., Pomsaiyud, W.: Optimizing and tuning MapReduce jobs to improve the large-scale data analysis process. Int. J. Intell. Syst. 28(2), 185\u2013200 (2013)","journal-title":"Int. J. Intell. Syst."},{"issue":"1","key":"395_CR51","doi-asserted-by":"crossref","first-page":"285","DOI":"10.14778\/1920841.1920881","volume":"3","author":"Y Bu","year":"2010","unstructured":"Bu, Y., Howe, B., Balazinska, M., Ernst, M.D.: Haloop: efficient iterative data processing on large clusters. Proc. VLDB Endow. 3(1), 285\u2013296 (2010)","journal-title":"Proc. VLDB Endow."},{"key":"395_CR52","doi-asserted-by":"crossref","unstructured":"Kambatla, K., Rapolu, N., Jagannathan, S., Grama, A.: Asynchronous algorithms in MapReduce. In: Proceedings of 2010 IEEE International Conference on Cluster Computing, Cluster, pp. 245\u2013254 (2010)","DOI":"10.1109\/CLUSTER.2010.30"},{"key":"395_CR53","doi-asserted-by":"crossref","unstructured":"Elnikety, E., Elsayed, T., Ramadan, H.E.: IHadoop: asynchronous iterations for MapReduce. In: Proceedings of 2011 3rd IEEE International Conference on Cloud Computing Technology and Science, pp. 81\u201390 (2011)","DOI":"10.1109\/CloudCom.2011.21"},{"key":"395_CR54","doi-asserted-by":"crossref","unstructured":"Wang, L., Ni, Z., Zhang, Y., Wu, Z., Tang, L.: Pipelined-MapReduce: an improved MapReduce parallel programming model. In: Proceedings of 4th International Conference on Intelligent Computation Technology and Automation, pp. 871\u2013874 (2011)","DOI":"10.1109\/ICICTA.2011.593"},{"key":"395_CR55","doi-asserted-by":"crossref","unstructured":"Xu, W., Gong, X.J., Li, X.Y.: MapCombine: a lightweight solution to improve the efficiency of iterative MapReduce. In: Proceedings of iCETS 2012, pp. 444\u2013456","DOI":"10.1007\/978-3-642-34447-3_40"},{"issue":"1","key":"395_CR56","doi-asserted-by":"crossref","first-page":"47","DOI":"10.1007\/s10723-012-9204-9","volume":"10","author":"YF Zhang","year":"2012","unstructured":"Zhang, Y.F., Gao, Q.X., Gao, L.X., Wang, C.R.: iMapReduce: a distributed computing framework for iterative computation. J. Grid Comput. 10(1), 47\u201368 (2012)","journal-title":"J. Grid Comput."},{"key":"395_CR57","unstructured":"Zaharia, M., Chowdhury, M., Das, T., Dave, A., Ma, J., Mccauley, M., Franklin, M., Shenker, S., Stoica, I.: Resilient Distributed Datasets: A Fault-Tolerant Abstraction for In-Memory Cluster Computing. In: USENIX Symposium on Networked Systems Design and Implementation, vol. 70, pp. 141\u2013146 (2012)"},{"issue":"4","key":"395_CR58","doi-asserted-by":"crossref","first-page":"1035","DOI":"10.1016\/j.future.2012.05.027","volume":"29","author":"T Gunarathne","year":"2013","unstructured":"Gunarathne, T., Zhang, B.J., Wu, T.L., Qiu, J.: Scalable parallel computing on clouds using Twister4Azure iterative MapReduce. Future Gener. Comput. Syst. 29(4), 1035\u20131048 (2013)","journal-title":"Future Gener. Comput. Syst."},{"key":"395_CR59","unstructured":"Condie, T., Conway, N., Alvaro, P., Hellerstein, M., Elmeleegy, K., Sears, R.: MapReduce Online. EECS Department, University of California, Berkeley. Tech. Rep. http:\/\/www.eecs.berkeley.edu\/Pubs\/TechRpts\/2009\/EECS-2009-136.html"},{"key":"395_CR60","doi-asserted-by":"crossref","unstructured":"B\u00f6se, J. H., Andrzejak, A., Hogqvist, M.: Beyond online aggregation: Parallel and incremental data mining with online Map-Reduce. In: Proceedings of 2010 Workshop on Massive Data Analytics on the Cloud, MDAC 2010, in Association with the 19th Annual World Wide Web Conference (2010)","DOI":"10.1145\/1779599.1779602"},{"key":"395_CR61","unstructured":"Phan, L.T.X., Zhang, Z., Loo, B.T., Lee, I.: Real-Time MapReduce Scheduling. Technical Report, University of Pennsylvania (2010)"},{"key":"395_CR62","doi-asserted-by":"crossref","unstructured":"Dou, A.J., Kalogeraki, V., Gunopulos, D., Mielikainen, T., Tuulos, V.: Scheduling for real-time mobile MapReduce systems. In: Proceedings of the 5th ACM International Conference on Distributed Event-Based Systems, pp. 247\u2013258 (2011)","DOI":"10.1145\/2002259.2002305"},{"key":"395_CR63","doi-asserted-by":"crossref","unstructured":"Peng, C.-Z., Jiang, Z.-J., Cai, X.-B., Zhang, Z.-K.: Real-time analytics processing with MapReduce. In: Proceedings of 2012 International Conference on Machine Learning and Cybernetics, vol. 4, pp. 1308\u20131311 (2012)","DOI":"10.1109\/ICMLC.2012.6359554"},{"issue":"3","key":"395_CR64","doi-asserted-by":"crossref","first-page":"477","DOI":"10.3724\/SP.J.1016.2012.00477","volume":"35","author":"K Qi","year":"2012","unstructured":"Qi, K., Zhao, Z., Fang, J., Ma, Q.: Real-time processing for high speed data stream over large scale data. Chin. J. Comput. 35(3), 477\u2013490 (2012)","journal-title":"Chin. J. Comput."},{"key":"395_CR65","unstructured":"Zaharia, M., Chowdhury, M., Franklin, M.J., Shenker, S., Stoica, I.: Spark: cluster computing with working sets. In: Proceedings of the 2nd USENIX Conference on Hot Topics in Cloud Computing (2010)"},{"key":"395_CR66","doi-asserted-by":"crossref","unstructured":"Hong, C., Chen, D., Chen, W., Zheng, W., Lin, H.: MapCG: Writing parallel program portable between CPU and GPU. In: Proceedings of 19th International Conference on Parallel Architecture and Compilation Techniques, pp. 217\u2013226 (2010)","DOI":"10.1145\/1854273.1854303"},{"key":"395_CR67","doi-asserted-by":"crossref","unstructured":"Jiang, W., Ravi, V.T., Agrawal, G.: A Map-reduce system with an Alternate API for multi-core environments. In: Proceedings of 10th IEEE\/ACM International Symposium on Cluster, Cloud, and Grid Computing, pp. 84\u201393 (2010)","DOI":"10.1109\/CCGRID.2010.10"},{"key":"395_CR68","doi-asserted-by":"crossref","unstructured":"Stuart, J.A., Chen, C.-K., Ma, K.-L., Owens, J.D.: Multi-GPU volume rendering using MapReduce. In: Proceedings of 19th ACM International Symposium on High Performance Distributed Computing, pp. 841\u2013848 (2010)","DOI":"10.1145\/1851476.1851597"},{"issue":"4","key":"395_CR69","doi-asserted-by":"crossref","first-page":"608","DOI":"10.1109\/TPDS.2010.158","volume":"22","author":"W Fang","year":"2011","unstructured":"Fang, W., He, B., Luo, Q., Govindaraju, N.K.: Mars: accelerating MapReduce with graphics processors. IEEE Trans. Parallel Distrib. Syst. 22(4), 608\u2013620 (2011)","journal-title":"IEEE Trans. Parallel Distrib. Syst."},{"key":"395_CR70","doi-asserted-by":"crossref","unstructured":"Elteir, M., Lin, H., Feng, W.-C., Scogland, T.: StreamMR: an optimized MapReduce framework for AMD GPUs. In: Proceedings of 17th IEEE International Conference on Parallel and Distributed Systems, pp. 364\u2013371 (2011)","DOI":"10.1109\/ICPADS.2011.131"},{"key":"395_CR71","doi-asserted-by":"crossref","unstructured":"Chen, L., Agrawal, G.: Optimizing MapReduce for GPUs with effective shared memory usage. In: Proceedings of 21st ACM Symposium on High-Performance Parallel and Distributed Computing, pp. 199\u2013210 (2012)","DOI":"10.1145\/2287076.2287109"},{"issue":"4","key":"395_CR72","doi-asserted-by":"crossref","first-page":"522","DOI":"10.1016\/j.jpdc.2013.01.004","volume":"73","author":"C Basaran","year":"2013","unstructured":"Basaran, C., Kang, K.D.: Grex: an efficient MapReduce framework for graphics processing units. J. Parallel Distrib. Comput. 73(4), 522\u2013533 (2013)","journal-title":"J. Parallel Distrib. Comput."},{"key":"395_CR73","first-page":"1","volume":"10","author":"R Chen","year":"2013","unstructured":"Chen, R., Chen, H.: Tiled-mapreduce: efficient and flexible mapreduce processing on multicore with tiling. Trans. Archit. Code Optim. 10, 1 (2013)","journal-title":"Trans. Archit. Code Optim."},{"issue":"5","key":"395_CR74","doi-asserted-by":"crossref","first-page":"10:1","DOI":"10.1147\/JRD.2009.5429076","volume":"53","author":"M Krujif de","year":"2009","unstructured":"de Krujif, M., Sankaralingam, K.: MapReduce for the Cell B.E. architecture. IBM J. Res. Dev. 53(5), 10:1\u201310:12 (2009)","journal-title":"IBM J. Res. Dev."},{"key":"395_CR75","doi-asserted-by":"crossref","first-page":"25","DOI":"10.1145\/1531793.1531800","volume":"43","author":"MM Rafique","year":"2009","unstructured":"Rafique, M.M., Rose, B., Butt, A.R., Nikolopoulos, D.S.: Supporting MapReduce on large-scale asymmetric multi-core clusters. Oper. Syst. Rev. 43, 25\u201334 (2009)","journal-title":"Oper. Syst. Rev."},{"key":"395_CR76","doi-asserted-by":"crossref","unstructured":"Papagiannis, A., Nikolopoulos, D.S.: Rearchitecting MapReduce for heterogeneous multicore processors with explicitly managed memories. In: Proceedings of 39th International Conference on Parallel Processing, pp. 121\u2013130 (2010)","DOI":"10.1109\/ICPP.2010.21"},{"key":"395_CR77","doi-asserted-by":"crossref","unstructured":"He, C., Weitzel, D., Swanson, D., Lu, Y.: HOG: Distributed Hadoop MapReduce on the grid. In: Proceedings of 2012 SC Companion: High Performance Computing, Networking Storage and Analysis, pp. 1276\u20131283 (2012)","DOI":"10.1109\/SC.Companion.2012.154"},{"key":"395_CR78","doi-asserted-by":"crossref","unstructured":"Heintz, B., Wang, C., Chandra, A., Weissman, J.: Cross-phase optimization in mapreduce. In: Proceedings of 1st IEEE International Conference on Cloud Engineering, pp. 338\u2013347 (2013)","DOI":"10.1109\/IC2E.2013.26"},{"issue":"3","key":"395_CR79","doi-asserted-by":"crossref","first-page":"739","DOI":"10.1016\/j.future.2012.09.001","volume":"29","author":"L Wang","year":"2013","unstructured":"Wang, L., Tao, J., Ranjan, R., Marten, H., Streit, A., Chen, J., Chen, D.: G-Hadoop: MapReduce across distributed data centers for data-intensive computing. Future Gener. Comput. Syst. 29(3), 739\u2013750 (2013)","journal-title":"Future Gener. Comput. Syst."},{"key":"395_CR80","doi-asserted-by":"crossref","unstructured":"Mantha, P.K., Luckow, A., Jha, S.: Pilot-MapReduce: an extensible and flexible MapReduce implementation for distributed data. In: Proceedings of 2012 3rd International Workshop on MapReduce and Its Applications, pp. 17\u201324 (2012)","DOI":"10.1145\/2287016.2287020"},{"issue":"5","key":"395_CR81","doi-asserted-by":"crossref","first-page":"1382","DOI":"10.1016\/j.jcss.2011.12.021","volume":"78","author":"F Marozzo","year":"2012","unstructured":"Marozzo, F., Talia, D., Trunfio, P.: P2P-MapReduce: parallel data processing in dynamic cloud environments. J. Comput. Syst. Sci. 78(5), 1382\u20131402 (2012)","journal-title":"J. Comput. Syst. Sci."},{"key":"395_CR82","doi-asserted-by":"crossref","unstructured":"Wang, G., Butt, A.R., Pandey, P., Gupta, K.: Using realistic simulation for performance analysis of MapReduce setups. In: Proceedings of 1st ACM Workshop on Large-Scale System and Application Performance, pp. 16\u201329 (2009)","DOI":"10.1145\/1552272.1552278"},{"key":"395_CR83","doi-asserted-by":"crossref","unstructured":"Hammoud, S., Li, M., Liu, Y., Alham, N.K., Liu, Z.: MRSim: a discrete event based MapReduce simulator. In: Proceedings of 2010 Seventh International Conference on Fuzzy Systems and Knowledge Discovery, pp. 2993\u20132997 (2010)","DOI":"10.1109\/FSKD.2010.5569086"},{"key":"395_CR84","doi-asserted-by":"crossref","unstructured":"Huang, D., Shi, X., Ibrahim, S., Lu, L., Liu, H., Wu, S., Jin, H.: MR-Scope: a real-time tracing tool for MapReduce. In: Proceedings of 19th ACM International Symposium on High Performance Distributed Computing, pp. 849\u2013855 (2010)","DOI":"10.1145\/1851476.1851598"},{"key":"395_CR85","doi-asserted-by":"crossref","unstructured":"Teng, F., Yu, L., Magoules, F.: SimMapReduce: a simulator for modeling MapReduce framework. In: Proceedings of the 2011 5th FTRA International Conference on Multimedia and Ubiquitous Engineering, pp. 277\u2013282 (2011)","DOI":"10.1109\/MUE.2011.56"},{"key":"395_CR86","doi-asserted-by":"crossref","unstructured":"Wang, K., Lin, X., Tang, W.: Predator\u2014an experience guided configuration optimizer for Hadoop MapReduce. In: Proceedings of 4th IEEE International Conference on Cloud Computing Technology and Science, pp. 419\u2013426 (2012)","DOI":"10.1109\/CloudCom.2012.6427486"},{"issue":"2","key":"395_CR87","doi-asserted-by":"crossref","first-page":"279","DOI":"10.1007\/s10723-011-9201-4","volume":"10","author":"HL Yang","year":"2012","unstructured":"Yang, H.L., Luan, Z.Z., Li, W.J., Qian, D.P.: MapReduce workload modeling with statistical approach. J. Grid Comput. 10(2), 279\u2013310 (2012)","journal-title":"J. Grid Comput."},{"issue":"4\u20135","key":"395_CR88","doi-asserted-by":"crossref","first-page":"233","DOI":"10.1016\/j.parco.2013.02.001","volume":"39","author":"W Kolberg","year":"2013","unstructured":"Kolberg, W., Marcos, P.D., Anjos, J.C.S., Miyazaki, A.K.S., Geyer, C.R., Arantes, L.B.: MRSG\u2014a MapReduce simulator over SimGrid. Parallel Comput. 39(4\u20135), 233\u2013244 (2013)","journal-title":"Parallel Comput."},{"issue":"1","key":"395_CR89","doi-asserted-by":"crossref","first-page":"300","DOI":"10.1016\/j.future.2011.05.007","volume":"29","author":"Y Liu","year":"2013","unstructured":"Liu, Y., Li, M.Z., Alham, N.K., Hammoud, S.: HSim: a MapReduce simulator in enabling cloud computing. Future Gener. Comput. Syst. 29(1), 300\u2013308 (2013)","journal-title":"Future Gener. Comput. Syst."},{"issue":"4","key":"395_CR90","doi-asserted-by":"crossref","first-page":"495","DOI":"10.1007\/s10766-012-0227-4","volume":"41","author":"E Vianna","year":"2013","unstructured":"Vianna, E., Comarela, G., Pontes, T., Almeida, J., Almeida, V., Wilkinson, K., Kuno, H., Dayal, U.: Analytical performance models for MapReduce workloads. Int. J. Parallel Prog. 41(4), 495\u2013525 (2013)","journal-title":"Int. J. Parallel Prog."},{"key":"395_CR91","doi-asserted-by":"crossref","unstructured":"Leverich, J., Kozyrakis, C.: On the energy (In) efficiency of Hadoop Clusters. In: Proceedings of HotPower (2009)","DOI":"10.1145\/1740390.1740405"},{"key":"395_CR92","doi-asserted-by":"crossref","unstructured":"Lang, W., Patel, J.: Energy management for MapReduce clusters. In: VLDB (2010)","DOI":"10.14778\/1920841.1920862"},{"key":"395_CR93","doi-asserted-by":"crossref","unstructured":"Kaushik, R.T., et al.: Evaluation and analysis if GreenHDFS: a selft-adaptive. Energy-conserving variant of the Hadoop distributed file system. In: Proceedings of IEEE CloudCom (2010)","DOI":"10.1109\/CloudCom.2010.109"},{"key":"395_CR94","doi-asserted-by":"crossref","unstructured":"Chen, Y., Alspaugh, S., Borthakur, D., Katz, R.: Energy efficiency for large-scale MapReduce workloads with significant interactive analysis. In: Proceedings of EuroSys (2012)","DOI":"10.1145\/2168836.2168842"},{"key":"395_CR95","doi-asserted-by":"crossref","unstructured":"Yoon, E., Squicciarini, A.: Toward detecting compromised MapReduce workers through log analysis. In: Proceedings of 14th IEEE\/ACM International Symposium on Cluster, Cloud and Grid Computing (2014)","DOI":"10.1109\/CCGrid.2014.120"},{"key":"395_CR96","unstructured":"Roy, I., Setty, S.T.V., Kilzer, A., Shmatikov, V., Witchel, E.: Airavat: security and privacy for MapReduce. In: NSDI (2010)"},{"key":"395_CR97","doi-asserted-by":"crossref","unstructured":"Wei, W., Du, J., Yu, T., Gu, X.: SecureMR: a service integrity assurance framework for MapReduce. In: Proceedings of 2009 Annual Computer Security Applications Conference (2009)","DOI":"10.1109\/ACSAC.2009.17"},{"key":"395_CR98","doi-asserted-by":"crossref","unstructured":"Chen, X., Huang, Q.: The data protection of MapReduce using homomorphic encryption. In: Proceedings of 4th IEEE International Conference on Software Engineering and Service Science, pp. 419\u2013421 (2013)","DOI":"10.1109\/ICSESS.2013.6615338"},{"key":"395_CR99","doi-asserted-by":"crossref","unstructured":"Guo, Z., Zhu, X., Guo, L., Kang, S.: Design of a security framework On MapReduce. In: Proceedings of 5th International Conference on Intelligent Networking and Collaborative Systems, pp. 139\u2013145 (2013)","DOI":"10.1109\/INCoS.2013.29"},{"issue":"8","key":"395_CR100","first-page":"4587","volume":"11","author":"H Han","year":"2013","unstructured":"Han, H., Zheng, W.: A privacy data-oriented hierarchical MapReduce programming model. Telkomnika Indones. J. Electr. Eng. 11(8), 4587\u20134593 (2013)","journal-title":"Telkomnika Indones. J. Electr. Eng."},{"key":"395_CR101","doi-asserted-by":"crossref","unstructured":"Zhang, C., Chang, E.-C., Yap, R.H.C.: Tagged-MapReduce: a general framework for secure computing with mixed-sensitivity data on hybrid clouds. In: Proceedings of 14th IEEE\/ACM International Symposium on Cluster, Cloud, and Grid Computing (2014)","DOI":"10.1109\/CCGrid.2014.96"},{"key":"395_CR102","unstructured":"Apache Pig. http:\/\/pig.apache.org\/ . Accessed May 2015"},{"key":"395_CR103","unstructured":"Cascading. http:\/\/www.cascading.org\/ . Accessed May 2015"},{"key":"395_CR104","unstructured":"Scalding. http:\/\/www.cascading.org\/projects\/scalding\/ . Accessed May 2015"},{"issue":"4","key":"395_CR105","first-page":"277","volume":"13","author":"R Pike","year":"2005","unstructured":"Pike, R., Dorward, S., Griesemer, R., Quinlan, S.: Interpreting the data: parallel analysis with Sawzall. Sci. Program. 13(4), 277\u2013298 (2005)","journal-title":"Sci. Program."},{"key":"395_CR106","unstructured":"Summingbird. https:\/\/github.com\/twitter\/summingbird . Accessed May 2015"},{"key":"395_CR107","doi-asserted-by":"crossref","unstructured":"Akidau, T., Balikov, A., Chernyak, S., Haberman, J., Lax, R., Mcveety, S., Mills, D., Nordstrom, P., Whittle, S.: MillWheel: faulttolerant stream processing at Internet scale. In: Proceedings of the 39th International Conference on Very Large Data Bases, VLDB, vol. 6 (2013)","DOI":"10.14778\/2536222.2536229"},{"key":"395_CR108","doi-asserted-by":"crossref","unstructured":"Lu, M., Zhang, L., Huynh, H.P., Ong, Z., Liang, Y., He, B., Goh, R.S.M., Huynh, R.: Optimizing the MapReduce framework on Intel Xeon Phi coprocessor. In: Proceedings of IEEE International Conference on Big Data (2013)","DOI":"10.1109\/BigData.2013.6691563"},{"key":"395_CR109","unstructured":"QT. http:\/\/www.qt.io\/download\/ . Accessed Oct 2015"}],"container-title":["International Journal of Parallel Programming"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10766-015-0395-0.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10766-015-0395-0\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10766-015-0395-0","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,31]],"date-time":"2025-05-31T06:33:05Z","timestamp":1748673185000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10766-015-0395-0"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,10,29]]},"references-count":109,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2016,8]]}},"alternative-id":["395"],"URL":"https:\/\/doi.org\/10.1007\/s10766-015-0395-0","relation":{},"ISSN":["0885-7458","1573-7640"],"issn-type":[{"type":"print","value":"0885-7458"},{"type":"electronic","value":"1573-7640"}],"subject":[],"published":{"date-parts":[[2015,10,29]]}}}