{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2023,6,28]],"date-time":"2023-06-28T21:33:07Z","timestamp":1687987987621},"reference-count":63,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2016,4,8]],"date-time":"2016-04-08T00:00:00Z","timestamp":1460073600000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/creativecommons.org\/licenses\/by\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Big Data"],"published-print":{"date-parts":[[2016,12]]},"DOI":"10.1186\/s40537-016-0041-8","type":"journal-article","created":{"date-parts":[[2016,4,8]],"date-time":"2016-04-08T23:00:44Z","timestamp":1460156444000},"update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":14,"title":["Feasibility analysis of AsterixDB and Spark streaming with Cassandra for stream-based processing"],"prefix":"10.1186","volume":"3","author":[{"given":"Pekka","family":"P\u00e4\u00e4kk\u00f6nen","sequence":"first","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2016,4,8]]},"reference":[{"key":"41_CR1","doi-asserted-by":"crossref","unstructured":"Thusoo A et al. Data warehousing and analytics infrastructure at Facebook. Paper presented at the ACM SIGMOD international conference on management of data, Indianapolis, Indiana, USA, 6\u201311 June 2010.","DOI":"10.1145\/1807167.1807278"},{"key":"41_CR2","doi-asserted-by":"crossref","unstructured":"Sumbaly R, Kreps J, Shah S. The \u201cBig Data\u201d ecosystem at LinkedIn. Paper presented at the ACM SIGMOD international conference on management of data, New York, New York, USA, 22\u201327 June 2013.","DOI":"10.1145\/2463676.2463707"},{"key":"41_CR3","doi-asserted-by":"crossref","unstructured":"Mishne G, Dalton J, Li Z, Sharma A, Lin J. Fast Data in the era of Big Data: Twitter\u2019s real-time related query suggestion architecture. Paper presented at the ACM SIGMOD international conference on management of data, New York, New York, USA, 22\u201327 June 2013.","DOI":"10.1145\/2463676.2465290"},{"key":"41_CR4","doi-asserted-by":"crossref","unstructured":"Busch M et al. EarlyBird: real-time search at Twitter. Paper presented at the IEEE 28th international conference on data engineering, Washington, DC, USA, 1\u20135 April 2012.","DOI":"10.1109\/ICDE.2012.149"},{"key":"41_CR5","doi-asserted-by":"crossref","unstructured":"Kulkarni S et al. Twitter heron: stream processing at scale. Paper presented at SIGMOD 2015, Melbourne, Victoria, Australia, 31 May\u20134 June 2015.","DOI":"10.1145\/2723372.2742788"},{"key":"41_CR6","doi-asserted-by":"crossref","first-page":"11","DOI":"10.1145\/2674026.2674029","volume":"16","author":"O Goonetilleke","year":"2014","unstructured":"Goonetilleke O, Sellis T, Zhang X, Sathe S. Twitter analytics: a Big Data management perspective. SIGKDD Explor. 2014;16:11\u20139. doi: 10.1145\/2674026.2674029 .","journal-title":"SIGKDD Explor"},{"key":"41_CR7","doi-asserted-by":"crossref","first-page":"462","DOI":"10.1002\/asi.23186","volume":"66","author":"A Zubiaga","year":"2015","unstructured":"Zubiaga A, Spina D, Martinez R, Fresno V. Real-time classification of Twitter trends. J Assoc Inf Sci Tech. 2015;66:462\u201373. doi: 10.1002\/asi.23186 .","journal-title":"J Assoc Inf Sci Tech"},{"key":"41_CR8","doi-asserted-by":"crossref","first-page":"250","DOI":"10.1108\/AJIM-09-2013-0083","volume":"66","author":"MFNJ Proferes","year":"2014","unstructured":"Proferes MFNJ. A topology of Twitter research: disciplines, methods, and ethics. Aslib J Inf Manag. 2014;66:250\u201361.","journal-title":"Aslib J Inf Manag"},{"key":"41_CR9","doi-asserted-by":"crossref","unstructured":"Lu R, Wu G, Xie B, Hu J. StreamBench: towards benchmarking modern distributed stream computing frameworks. Paper presented at the IEEE\/ACM 7th international conference on utility and cloud computing, London, Great Britain, 8\u201311 December 2014.","DOI":"10.1109\/UCC.2014.15"},{"key":"41_CR10","first-page":"138","volume-title":"BDGS: a scalable Big Data generator suite in Big Data benchmarking. Lectures notes in computer science","author":"Z Ming","year":"2014","unstructured":"Ming Z, Luo C, Gao W, Han R, Yang Q, Wang L, Zhan J. BDGS: a scalable Big Data generator suite in Big Data benchmarking. Lectures notes in computer science, vol. 8585. Switzerland: Springer; 2014. p. 138\u201354."},{"key":"41_CR11","first-page":"111","volume-title":"Performance benefits of DataMPI: a case study with BigDataBench. Lecture notes in computer science","author":"F Liang","year":"2014","unstructured":"Liang F, Feng C, Lu X, Xu Z. Performance benefits of DataMPI: a case study with BigDataBench. Lecture notes in computer science, vol. 8807. Switzerland: Springer; 2014. p. 111\u201323."},{"key":"41_CR12","doi-asserted-by":"crossref","unstructured":"Zaharia M, Das T, Li H, Hunter T, Shenker S, Stoica I. Discretized streams: fault-tolerant streaming computation at scale. Paper presented at the 24th ACM symposium on operating systems principles, Farmington, Pennsylvania, USA, 3\u20136 November 2013.","DOI":"10.1145\/2517349.2522737"},{"key":"41_CR13","doi-asserted-by":"crossref","unstructured":"Borkar V, Carey MJ, Li C. Inside \u201cBig Data management\u201d: Ogres, Onions, or Parfaits? Paper presented at the EDBT\/ICDT 2012 joint conference, Berlin, Germany, 26\u201330 March 2012.","DOI":"10.1145\/2247596.2247598"},{"key":"41_CR14","unstructured":"Grover R, Carey MJ. Data ingestion in AsterixDB. Paper presented at the 18th international conference on extending database technology. Brussels, Belgium, 23\u201327 March 2015."},{"key":"41_CR15","doi-asserted-by":"crossref","first-page":"464","DOI":"10.1016\/j.ijinfomgt.2013.01.001","volume":"33","author":"W He","year":"2013","unstructured":"He W, Zha S, Li L. Social media competitive analysis and text mining: a case study in the pizza industry. Int J Inf Manage. 2013;33:464\u201372.","journal-title":"Int J Inf Manage"},{"key":"41_CR16","doi-asserted-by":"crossref","first-page":"801","DOI":"10.1016\/j.im.2015.04.006","volume":"52","author":"W He","year":"2015","unstructured":"He W, Wu H, Yan G, Akula V, Shen J. A novel social media competitive analytics framework with sentiment benchmarks. Inf Manag. 2015;52:801\u201312.","journal-title":"Inf Manag"},{"key":"41_CR17","doi-asserted-by":"crossref","first-page":"247","DOI":"10.1016\/j.ijpe.2014.12.037","volume":"165","author":"B Chae","year":"2015","unstructured":"Chae B. Insights from hashtag #supplychain and Twitter analytics: considering Twitter and Twitter data for supply chain practise and research. Int J Prod Econ. 2015;165:247\u201359.","journal-title":"Int J Prod Econ"},{"key":"41_CR18","doi-asserted-by":"crossref","first-page":"45","DOI":"10.1016\/j.inffus.2015.08.005","volume":"28","author":"G Bello-Orgaz","year":"2016","unstructured":"Bello-Orgaz G, Jung JJ, Camacho D. Social big data: recent achievements and new challenges. Inf Fusion. 2016;28:45\u201359.","journal-title":"Inf Fusion"},{"key":"41_CR19","doi-asserted-by":"crossref","first-page":"82","DOI":"10.1145\/2436256.2436274","volume":"56","author":"R Feldman","year":"2013","unstructured":"Feldman R. Techniques and applications for sentiment analysis. Commun ACM. 2013;56:82\u20139. doi: 10.1145\/2436256.2436274 .","journal-title":"Commun ACM"},{"key":"41_CR20","doi-asserted-by":"crossref","first-page":"1093","DOI":"10.1016\/j.asej.2014.04.011","volume":"5","author":"W Medhat","year":"2014","unstructured":"Medhat W, Hassan A, Korashy H. Sentiment analysis algorithms and applications: a survey. Ain Shams Eng J. 2014;5:1093\u2013113.","journal-title":"Ain Shams Eng J"},{"key":"41_CR21","unstructured":"Abbasi A, Hassan A, Dhar M. Benchmarking Twitter sentiment analysis tools. Paper presented at the 9th international conference on language resources and evaluation, Reykjavik, Iceland, 26\u201331 May 2014."},{"key":"41_CR22","doi-asserted-by":"crossref","unstructured":"Rosenthal S. SemEval-2015 Task 10: sentiment analysis in Twitter. Paper presented at the 9th international workshop on semantic evaluation, Denver, Colorado, USA; 4\u20135 June 2015.","DOI":"10.18653\/v1\/S15-2078"},{"key":"41_CR23","doi-asserted-by":"crossref","first-page":"18","DOI":"10.1016\/j.ins.2015.03.040","volume":"311","author":"J Serrano-Guerrero","year":"2015","unstructured":"Serrano-Guerrero J, Olivas JA, Romero FP, Herrera-Viedma E. Sentiment analysis: a review and comparative analysis of web services. Inf Sci. 2015;311:18\u201338.","journal-title":"Inf Sci"},{"key":"41_CR24","doi-asserted-by":"crossref","unstructured":"Gon\u00e7alves P, Ara\u00fajo M, Benevenuto F, Cha M. Comparing and combining sentiment analysis methods. Paper presented at the conference on online social networks, Boston, MA, USA, 7\u20138 October 2013.","DOI":"10.1145\/2512938.2512951"},{"key":"41_CR25","unstructured":"Esuli A, Sebastiani F. SentiWordNet: a publicly available lexical resource for opinion mining. Paper presented at the 5th conference on language technology conference, Genova, Italy, 24\u201326 May 2006."},{"key":"41_CR26","unstructured":"Baccianella S, Esuli A, Sebastiani F. SentiWordNet 3.0: an enhanced lexical resource for sentiment analysis and opinion mining. Paper presented at the 7th international conference on language resources and evaluation, Malta, 17\u201323 May 2010."},{"key":"41_CR27","doi-asserted-by":"crossref","unstructured":"Mendes PN, Passant A, Kapanipathi P. Twarql: tapping into the wisdom of the crowd. Paper presented at the 6th international conference on semantic systems, Graz, Austria, 1\u20133 September 2010.","DOI":"10.1145\/1839707.1839762"},{"key":"41_CR28","doi-asserted-by":"crossref","unstructured":"Khuc VN, Shivade C, Ramnath R, Ramanathan J. Towards building large-scale distributed systems for Twitter sentiment analysis. Symposium on applied computing, Riva del Garda, Italy, 26\u201330 March 2012.","DOI":"10.1145\/2245276.2245364"},{"key":"41_CR29","doi-asserted-by":"crossref","unstructured":"Magdy A, Alarabi L, Al-Harthi S, Musleh M, Ghanem TM, Ghani S, Mokbel MF. Taghreed: a system for querying, analyzing, and visualizing Geotagged Microblogs. Paper presented at 22nd international conference on advances in geographic information systems, Dallas, Texas, USA, 4\u20137 November 2014.","DOI":"10.1145\/2666310.2666397"},{"key":"41_CR30","doi-asserted-by":"crossref","unstructured":"Lai C, Donahue J, Musaev A, Pu C. Nimbus: tuning filters service on Tweet streams. Paper presented at the IEEE international congress on Big Data, New York, USA, 27 June\u20132 July 2015.","DOI":"10.1109\/BigDataCongress.2015.95"},{"key":"41_CR31","author":"X Fang","year":"2015","unstructured":"Fang X, Zhan J. Sentiment analysis using product review data. J Big Data. 2015. doi: 10.1186\/s40537-015-0015-2 .","journal-title":"J Big Data"},{"key":"41_CR32","doi-asserted-by":"crossref","first-page":"166","DOI":"10.1016\/j.bdr.2015.01.001","volume":"2","author":"P P\u00e4\u00e4kk\u00f6nen","year":"2015","unstructured":"P\u00e4\u00e4kk\u00f6nen P, Pakkala D. Reference architecture and classification of technologies, products and services for big data systems. Big data Res. 2015;2:166\u201386. doi: 10.1016\/j.bdr.2015.01.001 .","journal-title":"Big data Res"},{"key":"41_CR33","unstructured":"Zaharia M, Chowdhury M, Das T, Dave A, Ma\u00a0J, McCauley M, Franklin MJ, Shenker S, Stoica I. Resilient distributed datasets: A fault-tolerant abstraction for in-memory cluster computing. Paper presented at the 9th USENIX conference on networked systems design and implementation. San Jose, California, USA, 25\u201327 April 2012."},{"key":"41_CR34","unstructured":"Spark-Cassandra-Connector. 2015. https:\/\/github.com\/datastax\/spark-cassandra-connector . Accessed 17 Sep 2015."},{"key":"41_CR35","doi-asserted-by":"crossref","unstructured":"Xin RS, Rosen J, Zaharia M, Franklin MJ, Shenker S, Stoica I. Shark: SQL and rich analytics at scale. Paper presented at the SIGMOD 2013, New York, New York, USA, 22\u201327 June 2013.","DOI":"10.21236\/ADA570737"},{"key":"41_CR36","unstructured":"Xin RS. Shark, Spark SQL, Hive on Spark, and the future of SQL on Spark. In: Databricks blog. 2014. https:\/\/databricks.com\/blog\/2014\/07\/01\/shark-spark-sql-hive-on-spark-and-the-future-of-sql-on-spark.html . Accessed 10 Aug 2015."},{"key":"41_CR37","doi-asserted-by":"crossref","unstructured":"Armbrust M, Das T, Davidson A, Ghodsi A, Or A, Rosen J, Stoica I, Wendell P, Xin R, Zaharia M. Scaling Spark in the real world: performance and usability. Paper presented at the 41st international conference on very large data bases, Kohala Coast, Hawaii, USA, 31 August\u20134 September 2015.","DOI":"10.14778\/2824032.2824080"},{"key":"41_CR38","unstructured":"Xin R, Wendell P. Announcing Spark 1.5. In: Databricks blog. 2015. https:\/\/databricks.com\/blog\/2015\/09\/09\/announcing-spark-1-5.html . Accessed 20 Oct 2015."},{"key":"41_CR39","first-page":"28","volume-title":"Evaluating new approaches of Big Data analytics frameworks Lecture notes in business information processing","author":"N Spangenberg","year":"2015","unstructured":"Spangenberg N, Roth M, Franczyk. Evaluating new approaches of Big Data analytics frameworks Lecture notes in business information processing, vol. 208. Switzerland: Springer; 2015. p. 28\u201337."},{"key":"41_CR40","unstructured":"Ousterhout K, Rasti R, Ratnasamy S, Shenker S, Chun B. Making sense of performance in data analytics frameworks. Paper presented at the 12th USENIX symposium on networked systems design and implementation, Oakland, California, USA, 4\u20136 May 2015."},{"key":"41_CR41","doi-asserted-by":"crossref","first-page":"24","DOI":"10.1186\/s40537-015-0032-1","volume":"2","author":"S Landset","year":"2015","unstructured":"Landset S, Khoshgoftaar TM, Richter AN, Hasanin T. A survey of open source tools for machine learning with big data in the Hadoop ecosystem. J Big Data. 2015;2:24.","journal-title":"J Big Data"},{"key":"41_CR42","doi-asserted-by":"crossref","unstructured":"Zheng J, Dagnino A (2014) An initial study of predictive machine learning analytics on large volumes of historical data for power system applications. Paper presented at the 2014 IEEE international conference on Big Data, Washington, DC, USA, 27\u201330 October 2014.","DOI":"10.1109\/BigData.2014.7004327"},{"key":"41_CR43","doi-asserted-by":"crossref","unstructured":"Bhuvan MS et al. (2015) Semantic sentiment analysis using context specific grammar. Paper presented at international conference on computing, communication and automation, Uttar Pradesh, India, 15\u201316 May 2015.","DOI":"10.1109\/CCAA.2015.7148366"},{"key":"41_CR44","unstructured":"Nodarakis N, Sioutas S, Tsakalidis A, Tzimas G. Large scale sentiment analysis on Twitter with Spark. Paper presented at the 1st international workshop on multi-engine data analytics, Bordeaux, France, 15 March 2016."},{"key":"41_CR45","doi-asserted-by":"crossref","unstructured":"Alsubaiee S et al. AsterixDB: a scalable, open source DBMS. Paper presented at the 40st international conference on very large data bases, Hangzhou, China, 1\u20135 September 2014.","DOI":"10.14778\/2733085.2733096"},{"key":"41_CR46","doi-asserted-by":"crossref","unstructured":"Borkar V et al. Algebricks: a data model-agnostic compiler backend for Big Data languages. Paper presented at the ACM symposium on cloud computing, Kohala Coast, Hawaii, USA, 27\u201329 August 2015.","DOI":"10.1145\/2806777.2806941"},{"key":"41_CR47","doi-asserted-by":"crossref","unstructured":"Borkar V, Carey M, Grover R, Onose N, Vernica R. Hyracks: a flexible and extensible foundation for data-intensive computing. Paper presented at the 27th international conference on data engineering, Hannover, Germany, 11\u201316 April 2011.","DOI":"10.1109\/ICDE.2011.5767921"},{"key":"41_CR48","unstructured":"AsterixDB. Apache Incubator. 2015. https:\/\/asterix-jenkins.ics.uci.edu\/job\/asterix-test-full\/site\/asterix-doc\/index.html . Accessed 20 Oct 2015."},{"key":"41_CR49","doi-asserted-by":"crossref","unstructured":"Pirzadeh P, Carey MJ, Westmann T. BigFun: a performance study of big data management system functionality. Paper presented at the 2015 IEEE international conference on Big Data, Santa Clara, California, USA, 29 October\u20131 November 2015.","DOI":"10.1109\/BigData.2015.7363793"},{"key":"41_CR50","doi-asserted-by":"crossref","unstructured":"Difallah DE, Pavlo A, Curino C, Cudre-Mauroux P. OLTP-Bench: an extensible Testbed for benchmarking relational databases. Paper presented at the 39th international conference on very large data bases, Riva del Carda, Italy, 26\u201330 August 2013.","DOI":"10.14778\/2732240.2732246"},{"key":"41_CR51","doi-asserted-by":"crossref","unstructured":"Erling O et al. The LDBC social network benchmark: interactive workload. Paper presented at SIGMOD, Melbourne, Australia, 31 May\u201304 June 2015.","DOI":"10.1145\/2723372.2742786"},{"key":"41_CR52","doi-asserted-by":"crossref","unstructured":"Arlitt M, Marwah M, Bellala G, Shah A, Healey J, Vandiver B. IoTAbench: an internet of things analytics benchmark. Paper presented at the 6th ACM\/SPEC international conference on performance engineering, Austin, Texas, USA, 31 January\u20134 February 2015.","DOI":"10.1145\/2668930.2688055"},{"key":"41_CR53","doi-asserted-by":"crossref","unstructured":"Li M, Tan J, Wang Y, Zhang L, Salapura V. SparkBench: a comprehensive benchmarking suite for in memory data analytic platform Spark. Paper presented at the ACM international conference on computing frontiers, Ischia, Italy, 18\u201321 May 2015.","DOI":"10.1145\/2742854.2747283"},{"key":"41_CR54","first-page":"25","volume-title":"Towards a Big Data benchmarking and demonstration suite for the online social network era with realistic workloads and live data. Lectures notes in computer science","author":"R Zhang","year":"2016","unstructured":"Zhang R, Manotas I, Li M, Hildebrand D. Towards a Big Data benchmarking and demonstration suite for the online social network era with realistic workloads and live data. Lectures notes in computer science, vol. 9495. Switzerland: Springer; 2016. p. 25\u201336."},{"key":"41_CR55","doi-asserted-by":"crossref","unstructured":"Braun L et al. Analytics in motion. Paper presented at SIGMOD 2015, Melbourne, Victoria, Australia, 31 May\u20134 June 2015.","DOI":"10.1145\/2723372.2742783"},{"key":"41_CR56","doi-asserted-by":"crossref","first-page":"18","DOI":"10.1186\/s40537-015-0025-0","volume":"2","author":"JR Louren\u00e7o","year":"2015","unstructured":"Louren\u00e7o JR, Cabral B, Carreiro P, Vieira M, Bernardino J. Choosing the right NoSQL database for the job: a quality attribute evaluation. J Big Data. 2015;2:18. doi: 10.1186\/s40537-015-0025-0 .","journal-title":"J Big Data"},{"key":"41_CR57","doi-asserted-by":"crossref","unstructured":"Klein J et al. Performance evaluation of NoSQL databases: a case study. Paper presented at the 1st workshop on performance analysis of Big Data systems, Austin, Texas, USA, 31 January\u20134 February 2015.","DOI":"10.1145\/2694730.2694731"},{"key":"41_CR58","doi-asserted-by":"crossref","unstructured":"Rabl T et al. Solving Big Data challenges for enterprise application performance management. Paper presented at the 38th international conference on very large data bases, Istanbul, Turkey, 27\u201331 August 2012.","DOI":"10.14778\/2367502.2367512"},{"key":"41_CR59","doi-asserted-by":"crossref","unstructured":"P\u00e4\u00e4kk\u00f6nen P, Pakkala D. The implications of disk-based RAID and virtualization for write-intensive services. Paper presented at the 30th Annual ACM Symposium on Applied Computing, Salamanca, Spain, 13\u201317 April 2015.","DOI":"10.1145\/2695664.2695982"},{"key":"41_CR60","unstructured":"Black EB. \u201cinverted index\u201d, in dictionary of algorithms and data structures.\u00a02008. https:\/\/xlinux.nist.gov\/dads\/\/HTML\/invertedIndex.html . Accessed 18 Jan 2016."},{"key":"41_CR61","unstructured":"Twitter API. Tweets. 2015 https:\/\/dev.twitter.com\/overview\/api\/tweets . Accessed 13 Nov 2015."},{"key":"41_CR62","volume-title":"Lightning Fast Cluster Computing with Cassandra and Spark","author":"P Kolaczkowski","year":"2014","unstructured":"Kolaczkowski P. Lightning Fast Cluster Computing with Cassandra and Spark. London: Code Mesh; 2014."},{"key":"41_CR63","first-page":"453","volume-title":"A comparative study on Twitter sentiment analysis: which features are good? Lectures notes in computer science","author":"F Koto","year":"2015","unstructured":"Koto F, Adriani M. A comparative study on Twitter sentiment analysis: which features are good? Lectures notes in computer science, vol. 9103. Switzerland: Springer; 2015. p. 453\u20137."}],"container-title":["Journal of Big Data"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-016-0041-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1186\/s40537-016-0041-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-016-0041-8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2019,9,6]],"date-time":"2019-09-06T11:03:31Z","timestamp":1567767811000},"score":1,"resource":{"primary":{"URL":"http:\/\/journalofbigdata.springeropen.com\/articles\/10.1186\/s40537-016-0041-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,4,8]]},"references-count":63,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2016,12]]}},"alternative-id":["41"],"URL":"https:\/\/doi.org\/10.1186\/s40537-016-0041-8","relation":{},"ISSN":["2196-1115"],"issn-type":[{"value":"2196-1115","type":"electronic"}],"subject":[],"published":{"date-parts":[[2016,4,8]]},"article-number":"6"}}