{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,28]],"date-time":"2026-04-28T08:34:44Z","timestamp":1777365284407,"version":"3.51.4"},"reference-count":106,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2025,5,23]],"date-time":"2025-05-23T00:00:00Z","timestamp":1747958400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"},{"start":{"date-parts":[[2025,5,23]],"date-time":"2025-05-23T00:00:00Z","timestamp":1747958400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["J Big Data"],"DOI":"10.1186\/s40537-025-01186-7","type":"journal-article","created":{"date-parts":[[2025,5,23]],"date-time":"2025-05-23T06:50:03Z","timestamp":1747983003000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["The wisdom of the lexicon crowds: leveraging on decades of lexicon-based sentiment analysis for improved results"],"prefix":"10.1186","volume":"12","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3417-3121","authenticated-orcid":false,"given":"Chelsey H.","family":"Hill","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9985-8362","authenticated-orcid":false,"given":"Jorge E.","family":"Fresneda","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0009-0007-6730-8922","authenticated-orcid":false,"given":"Murugan","family":"Anandarajan","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,5,23]]},"reference":[{"issue":"8","key":"1186_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3548772","volume":"55","author":"T 
Abdullah","year":"2022","unstructured":"Abdullah T, Ahmet A. Deep learning in sentiment analysis: recent architectures. ACM Comput Surv. 2022;55(8):1\u201335. https:\/\/doi.org\/10.1145\/3548772.","journal-title":"ACM Comput Surv"},{"key":"1186_CR2","doi-asserted-by":"crossref","unstructured":"Akter S, Aziz MT. (2016, 22\u201324 Sept. 2016). Sentiment analysis on facebook group using lexicon based approach. 2016 3rd International Conference on Electrical Engineering and Information Communication Technology (ICEEICT).","DOI":"10.1109\/CEEICT.2016.7873080"},{"issue":"1","key":"1186_CR3","doi-asserted-by":"publisher","first-page":"79","DOI":"10.1186\/s40537-022-00633-z","volume":"9","author":"RH Ali","year":"2022","unstructured":"Ali RH, Pinto G, Lawrie E, Linstead EJ. A large-scale sentiment analysis of tweets pertaining to the 2020 US presidential election. J Big Data. 2022;9(1):79. https:\/\/doi.org\/10.1186\/s40537-022-00633-z.","journal-title":"J Big Data"},{"key":"1186_CR4","doi-asserted-by":"crossref","unstructured":"Anandarajan M, Hill C, Nolan T. Practical text analytics. Volume 2. Springer; 2019.","DOI":"10.1007\/978-3-319-95663-3"},{"key":"1186_CR5","doi-asserted-by":"publisher","first-page":"937","DOI":"10.1016\/j.procs.2018.05.109","volume":"132","author":"Ankit","year":"2018","unstructured":"Ankit, Saleena N. An ensemble classification system for Twitter sentiment analysis. Procedia Comput Sci. 2018;132:937\u201346. https:\/\/doi.org\/10.1016\/j.procs.2018.05.109.","journal-title":"Procedia Comput Sci"},{"issue":"8","key":"1186_CR6","doi-asserted-by":"publisher","first-page":"1485","DOI":"10.1287\/mnsc.1110.1370","volume":"57","author":"N Archak","year":"2011","unstructured":"Archak N, Ghose A, Ipeirotis PG. Deriving the pricing power of product features by mining consumer reviews. Manage Sci. 2011;57(8):1485\u2013509. 
https:\/\/doi.org\/10.1287\/mnsc.1110.1370.","journal-title":"Manage Sci"},{"key":"1186_CR7","doi-asserted-by":"crossref","unstructured":"Aufar M, Andreswari R, Pramesti D. (2020, 5\u20136 Aug. 2020). Sentiment Analysis on Youtube Social Media Using Decision Tree and Random Forest Algorithm: A Case Study. 2020 International Conference on Data Science and Its Applications (ICoDSA).","DOI":"10.1109\/ICoDSA50139.2020.9213078"},{"key":"1186_CR8","doi-asserted-by":"publisher","DOI":"10.1109\/ASONAM.2014.6921696","volume-title":"Simpler is better?? Lexicon-based ensemble sentiment classification beats supervised methods","author":"L Augustyniak","year":"2014","unstructured":"Augustyniak L, Kajdanowicz T, Szymanski P, Tulig\u0142owicz W, Kazienko P, Alhajj R, Szymanski B. Simpler is better?? Lexicon-based ensemble sentiment classification beats supervised methods. Advances in Social Network Analysis and Mining, Beijing, China: IEEE\/ACM Int. Conf; 2014."},{"issue":"1","key":"1186_CR9","doi-asserted-by":"publisher","first-page":"4","DOI":"10.3390\/e18010004","volume":"18","author":"\u0141 Augustyniak","year":"2016","unstructured":"Augustyniak \u0141, Szyma\u0144ski P, Kajdanowicz T, Tulig\u0142owicz W. Comprehensive study on Lexicon-based ensemble classification sentiment analysis. Entropy. 2016;18(1):4. https:\/\/www.mdpi.com\/1099-4300\/18\/1\/4.","journal-title":"Entropy"},{"key":"1186_CR10","unstructured":"Baccianella S, Esuli A, Sebastiani F. (2010). Sentiwordnet 3.0: an enhanced lexical resource for sentiment analysis and opinion mining. International Conference on Language Resources and Evaluation, Valletta, Malta."},{"issue":"1","key":"1186_CR11","doi-asserted-by":"publisher","first-page":"10","DOI":"10.1186\/s40537-023-00861-x","volume":"11","author":"K Barik","year":"2024","unstructured":"Barik K, Misra S. Analysis of customer reviews with an improved VADER lexicon classifier. J Big Data. 2024;11(1):10. 
https:\/\/doi.org\/10.1186\/s40537-023-00861-x.","journal-title":"J Big Data"},{"key":"1186_CR12","doi-asserted-by":"crossref","unstructured":"Bayhaqy A, Sfenrianto S, Nainggolan K, Kaburuan ER. (2018). Sentiment analysis about E-commerce from tweets using decision tree, K-nearest neighbor, and na\u00efve bayes. 2018 international conference on orange technologies (ICOT).","DOI":"10.1109\/ICOT.2018.8705796"},{"key":"1186_CR13","doi-asserted-by":"publisher","first-page":"460","DOI":"10.1016\/j.tourman.2018.09.010","volume":"70","author":"J-W Bi","year":"2019","unstructured":"Bi J-W, Liu Y, Fan Z-P, Zhang J. Wisdom of crowds: conducting importance-performance analysis (IPA) through online reviews. Tour Manag. 2019;70:460\u201378. https:\/\/doi.org\/10.1016\/j.tourman.2018.09.010.","journal-title":"Tour Manag"},{"key":"1186_CR14","unstructured":"Bradley MM, Lang PJ. (1999). Affective norms for English words (ANEW): Instruction manual and affective ratings. Technical report C-1, the center for research in psychophysiology, University of Florida 30(1), 25\u201336."},{"issue":"2","key":"1186_CR15","doi-asserted-by":"publisher","first-page":"123","DOI":"10.1007\/BF00058655","volume":"24","author":"L Breiman","year":"1996","unstructured":"Breiman L. Bagging predictors. Mach Learn. 1996;24(2):123\u201340.","journal-title":"Mach Learn"},{"issue":"1","key":"1186_CR16","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1023\/A:1010933404324","volume":"45","author":"L Breiman","year":"2001","unstructured":"Breiman L. Random forests. Mach Learn. 2001;45(1):5\u201332.","journal-title":"Mach Learn"},{"key":"1186_CR17","unstructured":"Brown A, Rambaccussing D, Reade JJ, Rossi G. Using social media to identify market inefficiencies. 
evidence from Twitter and Betfair; 2016."},{"issue":"1","key":"1186_CR18","doi-asserted-by":"publisher","first-page":"170","DOI":"10.1016\/j.ejor.2020.05.034","volume":"288","author":"D Butler","year":"2021","unstructured":"Butler D, Butler R, Eakins J. Expert performance and crowd wisdom: evidence from english premier league predictions. Eur J Oper Res. 2021;288(1):170\u201382. https:\/\/doi.org\/10.1016\/j.ejor.2020.05.034.","journal-title":"Eur J Oper Res"},{"key":"1186_CR19","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1177\/1748301818761132","volume":"12","author":"H Butler","year":"2018","unstructured":"Butler H, Friend M, Bauer KW, Bihl TJ. The effectiveness of using diversity to select multiple classifier systems with varying classification thresholds. J Algorithms Comput Technol. 2018;12:187\u201399.","journal-title":"J Algorithms Comput Technol"},{"key":"1186_CR20","unstructured":"Cambria E, Poria S, Bajpai R, Schuller B. (2016). SenticNet 4: A semantic resource for sentiment analysis based on conceptual primitives. International Conference on Computational linguistics, Osaka, Japan."},{"key":"1186_CR21","doi-asserted-by":"publisher","first-page":"247","DOI":"10.1016\/j.ijpe.2014.12.037","volume":"165","author":"B Chae","year":"2015","unstructured":"Chae B. Insights from hashtag #supplychain and Twitter analytics: considering Twitter and Twitter data for supply chain practice and research. Int J Prod Econ. 2015;165:247\u201359. https:\/\/doi.org\/10.1016\/j.ijpe.2014.12.037.","journal-title":"Int J Prod Econ"},{"issue":"5","key":"1186_CR22","doi-asserted-by":"publisher","first-page":"1367","DOI":"10.1093\/rfs\/hhu001","volume":"27","author":"H Chen","year":"2014","unstructured":"Chen H, De P, Hu YJ, Hwang B-H. Wisdom of crowds: the value of stock opinions transmitted through social media. Rev Financial Stud. 
2014;27(5):1367\u2013403.","journal-title":"Rev Financial Stud"},{"key":"1186_CR23","doi-asserted-by":"publisher","first-page":"61","DOI":"10.1016\/j.knosys.2014.06.001","volume":"71","author":"H Cho","year":"2014","unstructured":"Cho H, Kim S, Lee J, Lee J-S. Data-driven integration of multiple sentiment dictionaries for lexicon-based sentiment classification of product reviews. Knowl Based Syst. 2014;71:61\u201371. https:\/\/doi.org\/10.1016\/j.knosys.2014.06.001.","journal-title":"Knowl Based Syst"},{"issue":"1","key":"1186_CR24","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1177\/001316446002000104","volume":"20","author":"J Cohen","year":"1960","unstructured":"Cohen J. A coefficient of agreement for nominal scales. Educ Psychol Meas. 1960;20(1):37\u201346. https:\/\/doi.org\/10.1177\/001316446002000104.","journal-title":"Educ Psychol Meas"},{"key":"1186_CR25","doi-asserted-by":"publisher","first-page":"e0275910","DOI":"10.1371\/journal.pone.0275910","volume":"17","author":"G Czarnek","year":"2022","unstructured":"Czarnek G, Stillwell D. Two is better than one: using a single emotion lexicon can lead to unreliable conclusions. PLoS ONE. 2022;17:e0275910.","journal-title":"PLoS ONE"},{"key":"1186_CR26","doi-asserted-by":"publisher","first-page":"170","DOI":"10.1016\/j.dss.2014.07.003","volume":"66","author":"NFF da Silva","year":"2014","unstructured":"da Silva NFF, Hruschka ER, Hruschka ER. Tweet sentiment analysis with classifier ensembles. Decis Support Syst. 2014;66:170\u20139. https:\/\/doi.org\/10.1016\/j.dss.2014.07.003.","journal-title":"Decis Support Syst"},{"key":"1186_CR27","doi-asserted-by":"publisher","first-page":"65","DOI":"10.1016\/j.dss.2016.11.001","volume":"94","author":"S Deng","year":"2017","unstructured":"Deng S, Sinha AP, Zhao H. Adapting sentiment lexicons to domain-specific social media texts. Decis Support Syst. 2017;94:65\u201376. 
https:\/\/doi.org\/10.1016\/j.dss.2016.11.001.","journal-title":"Decis Support Syst"},{"issue":"6","key":"1186_CR28","doi-asserted-by":"publisher","first-page":"480","DOI":"10.1108\/JCM-03-2017-2141","volume":"34","author":"C Dhaoui","year":"2017","unstructured":"Dhaoui C, Webster CM, Tan LP. Social media sentiment analysis: lexicon versus machine learning. J Consumer Mark. 2017;34(6):480\u20138. https:\/\/doi.org\/10.1108\/JCM-03-2017-2141.","journal-title":"J Consumer Mark"},{"key":"1186_CR29","doi-asserted-by":"publisher","first-page":"113769","DOI":"10.1016\/j.dss.2022.113769","volume":"162","author":"S Dhar","year":"2022","unstructured":"Dhar S, Bose I. Walking on air or hopping mad? Understanding the impact of emotions, sentiments and reactions on ratings in online customer reviews of mobile apps. Decis Support Syst. 2022;162:113769.","journal-title":"Decis Support Syst"},{"key":"1186_CR30","doi-asserted-by":"publisher","first-page":"707","DOI":"10.1016\/j.procs.2019.11.174","volume":"161","author":"Z Drus","year":"2019","unstructured":"Drus Z, Khalid H. Sentiment analysis in social media and its application: systematic literature review. Procedia Comput Sci. 2019;161:707\u201314. https:\/\/doi.org\/10.1016\/j.procs.2019.11.174.","journal-title":"Procedia Comput Sci"},{"issue":"7","key":"1186_CR31","doi-asserted-by":"publisher","first-page":"835","DOI":"10.1016\/j.im.2016.03.008","volume":"53","author":"M Eickhoff","year":"2016","unstructured":"Eickhoff M, Muntermann J. Stock analysts vs. the crowd: mutual prediction and the drivers of crowd wisdom. Inf Manag. 2016;53(7):835\u201345. https:\/\/doi.org\/10.1016\/j.im.2016.03.008.","journal-title":"Inf Manag"},{"key":"1186_CR32","doi-asserted-by":"publisher","unstructured":"Elsaid Moussa M, Mohamed H, E., Hassan Haggag M. Opinion mining: a hybrid framework based on lexicon and machine learning approaches. Int J Comput Appl. 2019;1\u20139. 
https:\/\/doi.org\/10.1080\/1206212X.2019.1615250.","DOI":"10.1080\/1206212X.2019.1615250"},{"key":"1186_CR33","volume-title":"SentiMerge: combining sentiment lexicons in a bayesian framework","author":"G Emerson","year":"2014","unstructured":"Emerson G, Declerck T. SentiMerge: combining sentiment lexicons in a bayesian framework. Ireland: Workshop on Lexical and Grammatical Resources for Language Processing, Dublin; 2014."},{"key":"1186_CR34","doi-asserted-by":"publisher","first-page":"26","DOI":"10.1016\/j.dss.2014.10.004","volume":"68","author":"E Fersini","year":"2014","unstructured":"Fersini E, Messina E, Pozzi FA. Sentiment analysis: bayesian ensemble learning. Decis Support Syst. 2014;68:26\u201338. https:\/\/doi.org\/10.1016\/j.dss.2014.10.004.","journal-title":"Decis Support Syst"},{"key":"1186_CR35","doi-asserted-by":"publisher","unstructured":"Fu T, Abbasi A, Zeng D, Chen H. Sentimental spidering: leveraging opinion information in focused crawlers. ACM Trans Inf Syst. 2012;30(4). https:\/\/doi.org\/10.1145\/2382438.2382443.","DOI":"10.1145\/2382438.2382443"},{"key":"1186_CR36","doi-asserted-by":"publisher","first-page":"450","DOI":"10.1038\/075450a0","volume":"75","author":"F Galton","year":"1907","unstructured":"Galton F. The wisdom of crowds. Nature. 1907;75:450\u20131.","journal-title":"Nature"},{"issue":"3","key":"1186_CR37","doi-asserted-by":"publisher","first-page":"1267","DOI":"10.1111\/jofi.12027","volume":"68","author":"D Garcia","year":"2013","unstructured":"Garcia D. Sentiment during recessions. J Finance. 2013;68(3):1267\u2013300. https:\/\/doi.org\/10.1111\/jofi.12027.","journal-title":"J Finance"},{"issue":"1","key":"1186_CR38","doi-asserted-by":"publisher","first-page":"44","DOI":"10.1186\/s40537-018-0152-5","volume":"5","author":"M Ghosh","year":"2018","unstructured":"Ghosh M, Sanyal G. An ensemble approach to stabilize the features for multi-domain sentiment analysis using supervised machine learning. J Big Data. 2018;5(1):44. 
https:\/\/doi.org\/10.1186\/s40537-018-0152-5.","journal-title":"J Big Data"},{"issue":"9","key":"1186_CR39","doi-asserted-by":"publisher","first-page":"699","DOI":"10.1016\/S0262-8856(01)00045-2","volume":"19","author":"G Giacinto","year":"2001","unstructured":"Giacinto G, Roli F. Design of effective neural network ensembles for image classification purposes. Image Vis Comput. 2001;19(9):699\u2013707.","journal-title":"Image Vis Comput"},{"issue":"3","key":"1186_CR40","doi-asserted-by":"publisher","first-page":"497","DOI":"10.1287\/isre.2016.0635","volume":"27","author":"PB Goes","year":"2016","unstructured":"Goes PB, Guo C, Lin M. Do incentive hierarchies induce user effort? Evidence from an online knowledge exchange. Inform Syst Res. 2016;27(3):497\u2013516.","journal-title":"Inform Syst Res"},{"issue":"2","key":"1186_CR41","doi-asserted-by":"publisher","first-page":"222","DOI":"10.1287\/isre.2013.0512","volume":"25","author":"PB Goes","year":"2014","unstructured":"Goes PB, Lin M, Au Yeung C-m. Popularity effect in user-generated content: evidence from online product reviews. Inform Syst Res. 2014;25(2):222\u201338.","journal-title":"Inform Syst Res"},{"key":"1186_CR42","doi-asserted-by":"publisher","unstructured":"Gon\u00e7alves P, Ara\u00fajo M, Benevenuto F, Cha M. (2013). Comparing and combining sentiment analysis methods Proceedings of the first ACM conference on Online social networks, Boston, Massachusetts, USA. https:\/\/doi.org\/10.1145\/2512938.2512951","DOI":"10.1145\/2512938.2512951"},{"key":"1186_CR43","doi-asserted-by":"crossref","unstructured":"Hamilton WL, Clark K, Leskovec J, Jurafsky D. (2016). Inducing domain-specific sentiment lexicons from unlabeled corpora. Proceedings of the conference on empirical methods in natural language processing. 
conference on empirical methods in natural language processing.","DOI":"10.18653\/v1\/D16-1057"},{"issue":"4","key":"1186_CR44","doi-asserted-by":"publisher","first-page":"423","DOI":"10.1002\/asi.24255","volume":"71","author":"H Hong","year":"2020","unstructured":"Hong H, Ye Q, Du Q, Wang GA, Fan W. Crowd characteristics and crowd wisdom: evidence from an online investment community. J Association Inform Sci Technol. 2020;71(4):423\u201335. https:\/\/doi.org\/10.1002\/asi.24255.","journal-title":"J Association Inform Sci Technol"},{"issue":"5","key":"1186_CR45","doi-asserted-by":"publisher","first-page":"580","DOI":"10.1111\/jpim.12396","volume":"34","author":"S Hoornaert","year":"2017","unstructured":"Hoornaert S, Ballings M, Malthouse EC, Van den Poel D. Identifying new product ideas: waiting for the wisdom of the crowd or screening ideas in real time. J Prod Innov Manage. 2017;34(5):580\u201397. https:\/\/doi.org\/10.1111\/jpim.12396.","journal-title":"J Prod Innov Manage"},{"key":"1186_CR46","doi-asserted-by":"publisher","DOI":"10.2307\/41703503","author":"C Hsinchun","year":"2012","unstructured":"Hsinchun C, Chiang RHL, Storey VC. Business intelligence and analytics: from big data to big impact. MIS Q. 2012;36(4):1165\u201388. https:\/\/doi.org\/10.2307\/41703503."},{"key":"1186_CR47","doi-asserted-by":"crossref","unstructured":"Hu M, Liu B. (2004). Mining and summarizing customer reviews. International Conference on Knowledge Discovery and Data Mining, Seattle, WA.","DOI":"10.1145\/1014052.1014073"},{"key":"1186_CR48","doi-asserted-by":"crossref","unstructured":"Hutto C, Gilbert E. (2014). Vader: A parsimonious rule-based model for sentiment analysis of social media text. International AAAI Conference on Web and Social Media, Ann Arbor, MI.","DOI":"10.1609\/icwsm.v8i1.14550"},{"key":"1186_CR49","unstructured":"Jockers ML. (2017). 
Syuzhet: extract sentiment and plot arcs from text. GitHub Retrieved 04\/15\/2021 from https:\/\/github.com\/mjockers\/syuzhet"},{"key":"1186_CR50","doi-asserted-by":"crossref","unstructured":"Jockers ML, Thalken R. Text analysis with R: for students of literature. Springer; 2020.","DOI":"10.1007\/978-3-030-39643-5"},{"issue":"1","key":"1186_CR51","doi-asserted-by":"publisher","first-page":"165","DOI":"10.1287\/isre.2014.0562","volume":"26","author":"SL Johnson","year":"2015","unstructured":"Johnson SL, Safadi H, Faraj S. The emergence of online community leadership. Inform Syst Res. 2015;26(1):165\u201387.","journal-title":"Inform Syst Res"},{"issue":"1","key":"1186_CR52","doi-asserted-by":"publisher","first-page":"5","DOI":"10.1186\/s40537-022-00680-6","volume":"10","author":"G Kaur","year":"2023","unstructured":"Kaur G, Sharma A. A deep learning-based model using hybrid feature extraction approach for consumer sentiment analysis. J Big Data. 2023;10(1):5. https:\/\/doi.org\/10.1186\/s40537-022-00680-6.","journal-title":"J Big Data"},{"key":"1186_CR53","doi-asserted-by":"publisher","first-page":"113304","DOI":"10.1016\/j.dss.2020.113304","volume":"135","author":"J Kazmaier","year":"2020","unstructured":"Kazmaier J, van Vuuren JH. A generic framework for sentiment analysis: leveraging opinion-bearing data to inform decision making. Decis Support Syst. 2020;135:113304. https:\/\/doi.org\/10.1016\/j.dss.2020.113304.","journal-title":"Decis Support Syst"},{"key":"1186_CR54","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40294-016-0016-9","volume":"4","author":"MT Khan","year":"2016","unstructured":"Khan MT, Durrani MY, Ali A, Inayat I, Khalid S, Khan KH. Sentiment analysis and the complex natural Language. Complex Adapt Syst Model. 
2016;4:1\u201319.","journal-title":"Complex Adapt Syst Model"},{"issue":"4","key":"1186_CR55","doi-asserted-by":"publisher","first-page":"491","DOI":"10.1177\/0165551517703514","volume":"44","author":"CSG Khoo","year":"2018","unstructured":"Khoo CSG, Johnkhan SB. Lexicon-based sentiment analysis: comparative evaluation of six sentiment lexicons. J Inform Sci. 2018;44(4):491\u2013511.","journal-title":"J Inform Sci"},{"key":"1186_CR56","unstructured":"Khoo CSG, Nourbakhsh A, Na JC. (2012). Sentiment analysis of online news text: a case study of appraisal theory. Online Inf Rev."},{"issue":"3","key":"1186_CR57","doi-asserted-by":"publisher","first-page":"766","DOI":"10.1177\/1094428117719322","volume":"21","author":"VB Kobayashi","year":"2018","unstructured":"Kobayashi VB, Mol ST, Berkers HA, Kismih\u00f3k G, Den Hartog DN. Text classification for organizational researchers: a tutorial. Organizational Res Methods. 2018a;21(3):766\u201399.","journal-title":"Organizational Res Methods"},{"issue":"3","key":"1186_CR58","doi-asserted-by":"publisher","first-page":"733","DOI":"10.1177\/1094428117722619","volume":"21","author":"VB Kobayashi","year":"2018","unstructured":"Kobayashi VB, Mol ST, Berkers HA, Kismih\u00f3k G, Den Hartog DN. Text mining in organizational research. Organizational Res Methods. 2018b;21(3):733\u201365.","journal-title":"Organizational Res Methods"},{"key":"1186_CR59","unstructured":"Kolchyna O, Souza TTP, Treleaven P, Aste T. (2015). Twitter sentiment analysis: Lexicon method, machine learning method and their combination. arXiv preprint arXiv:1507.00955."},{"issue":"2","key":"1186_CR60","doi-asserted-by":"publisher","first-page":"181","DOI":"10.1023\/A:1022859003006","volume":"51","author":"LI Kuncheva","year":"2003","unstructured":"Kuncheva LI, Whitaker CJ. Measures of diversity in classifier ensembles and their relationship with the ensemble accuracy. Mach Learn. 
2003;51(2):181\u2013207.","journal-title":"Mach Learn"},{"issue":"4","key":"1186_CR61","doi-asserted-by":"publisher","first-page":"940","DOI":"10.1287\/isre.2016.0674","volume":"27","author":"T Lappas","year":"2016","unstructured":"Lappas T, Sabnis G, Valkanas G. The impact of fake reviews on online visibility: A vulnerability assessment of the hotel industry. Inform Syst Res. 2016;27(4):940\u201361.","journal-title":"Inform Syst Res"},{"issue":"4","key":"1186_CR62","doi-asserted-by":"publisher","first-page":"1239","DOI":"10.2307\/41703506","volume":"36","author":"RYK Lau","year":"2012","unstructured":"Lau RYK, Liao SSY, Wong KF, Chiu DKW. Web 2.0 environmental scanning and adaptive decision support for business mergers and acquisitions. MIS Q. 2012;36(4):1239\u2013A1236. https:\/\/doi.org\/10.2307\/41703506.","journal-title":"MIS Q"},{"key":"1186_CR63","doi-asserted-by":"publisher","first-page":"245","DOI":"10.1007\/s12599-010-0114-8","volume":"2","author":"JM Leimeister","year":"2010","unstructured":"Leimeister JM. Collective intelligence. Bus Inform Syst Eng. 2010;2:245\u20138.","journal-title":"Bus Inform Syst Eng"},{"key":"1186_CR64","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1016\/j.knosys.2018.06.019","volume":"160","author":"Y Li","year":"2018","unstructured":"Li Y, Guo H, Zhang Q, Gu M, Yang J. Imbalanced text sentiment classification using universal and domain-specific knowledge. Knowl Based Syst. 2018;160:1\u201315. https:\/\/doi.org\/10.1016\/j.knosys.2018.06.019.","journal-title":"Knowl Based Syst"},{"key":"1186_CR65","doi-asserted-by":"crossref","unstructured":"Liu B. Sentiment analysis and opinion mining. Volume 1. Morgan & Claypool; 2012.","DOI":"10.1007\/978-3-031-02145-9_1"},{"key":"1186_CR66","unstructured":"Liu X, Zhang S, Wei F, Zhou M. (2011). 
Recognizing named entities in tweets Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies - Volume 1, Portland, Oregon."},{"key":"1186_CR67","unstructured":"Loria S. (2017). TextBlob: Simplified Text Processing. Retrieved 04\/14\/2021 from https:\/\/textblob.readthedocs.io\/en\/dev\/"},{"issue":"4","key":"1186_CR68","doi-asserted-by":"publisher","first-page":"1187","DOI":"10.1111\/1475-679X.12123","volume":"54","author":"T Loughran","year":"2016","unstructured":"Loughran T, McDonald B. Textual analysis in accounting and finance: A survey. J Accounting Res. 2016;54(4):1187\u2013230.","journal-title":"J Accounting Res"},{"key":"1186_CR69","doi-asserted-by":"publisher","first-page":"357","DOI":"10.1146\/annurev-financial-012820-032249","volume":"12","author":"T Loughran","year":"2020","unstructured":"Loughran T, McDonald B. Textual analysis in finance. Annual Rev Financial Econ. 2020;12:357\u201375.","journal-title":"Annual Rev Financial Econ"},{"issue":"4","key":"1186_CR70","doi-asserted-by":"publisher","first-page":"680","DOI":"10.1016\/j.dss.2012.05.025","volume":"53","author":"I Maks","year":"2012","unstructured":"Maks I, Vossen P. A lexicon model for deep sentiment analysis and opinion mining applications. Decis Support Syst. 2012;53(4):680\u20138.","journal-title":"Decis Support Syst"},{"key":"1186_CR71","doi-asserted-by":"publisher","first-page":"101889","DOI":"10.1109\/ACCESS.2022.3209662","volume":"10","author":"A Mardjo","year":"2022","unstructured":"Mardjo A, Choksuchat C. HyVADRF: hybrid VADER\u2013Random forest and GWO for bitcoin tweet sentiment analysis. IEEE Access. 2022;10:101889\u201397.","journal-title":"IEEE Access"},{"key":"1186_CR72","doi-asserted-by":"publisher","first-page":"98","DOI":"10.1016\/j.dss.2016.06.013","volume":"89","author":"M Meire","year":"2016","unstructured":"Meire M, Ballings M, Van den Poel D. 
The added value of auxiliary data in sentiment analysis of Facebook posts. Decis Support Syst. 2016;89:98\u2013112.","journal-title":"Decis Support Syst"},{"key":"1186_CR73","doi-asserted-by":"publisher","DOI":"10.1007\/s10796-021-10107-x","author":"S Mendon","year":"2021","unstructured":"Mendon S, Dutta P, Behl A, Lessmann S. A hybrid approach of machine learning and lexicons to sentiment analysis: enhanced insights from Twitter data of natural disasters. Inform Syst Front. 2021. https:\/\/doi.org\/10.1007\/s10796-021-10107-x.","journal-title":"Inform Syst Front"},{"key":"1186_CR74","unstructured":"Mohammad S, Turney P. (2010). Emotions evoked by common words and phrases: Using mechanical turk to create an emotion lexicon. NAACL HLT 2010 workshop on computational approaches to analysis and generation of emotion in text, Los Angeles, CA."},{"key":"1186_CR75","doi-asserted-by":"publisher","first-page":"1533","DOI":"10.1287\/mnsc.2015.2207","volume":"62","author":"E Mollick","year":"2015","unstructured":"Mollick E, Nanda R. Wisdom or madness? Comparing crowds with expert evaluation in funding the arts. Manage Sci. 2015;62:1533\u201353.","journal-title":"Manage Sci"},{"key":"1186_CR76","doi-asserted-by":"crossref","unstructured":"Mudinas A, Zhang D, Levene M. (2012). Combining lexicon and learning based approaches for concept-level sentiment analysis Proceedings of the First International Workshop on Issues of Sentiment Discovery and Opinion Mining, Beijing, China.","DOI":"10.1145\/2346676.2346681"},{"issue":"2","key":"1186_CR77","doi-asserted-by":"publisher","first-page":"126","DOI":"10.1038\/s41562-017-0273-4","volume":"2","author":"J Navajas","year":"2018","unstructured":"Navajas J, Niella T, Garbulsky G, Bahrami B, Sigman M. Aggregated knowledge from a small number of debates outperforms the wisdom of large crowds. Nat Hum Behav. 2018;2(2):126\u201332. 
https:\/\/doi.org\/10.1038\/s41562-017-0273-4.","journal-title":"Nat Hum Behav"},{"key":"1186_CR78","unstructured":"Nielsen F\u00c5. (2011). A new ANEW: Evaluation of a word list for sentiment analysis in microblogs. arXiv preprint arXiv:1103.2903."},{"key":"1186_CR79","first-page":"303","volume":"84","author":"M Nofer","year":"2014","unstructured":"Nofer M, Hinz O. Are crowds on the internet wiser than experts? The case of a stock prediction community. J Bus Econ. 2014;84:303\u201338.","journal-title":"J Bus Econ"},{"key":"1186_CR80","doi-asserted-by":"crossref","unstructured":"O\u2019Connor B, Balasubramanyan R, Routledge B, Smith N. (2010). From tweets to polls: Linking text sentiment to public opinion time series. Proceedings of the International AAAI Conference on Web and Social Media.","DOI":"10.1609\/icwsm.v4i1.14031"},{"key":"1186_CR81","doi-asserted-by":"publisher","first-page":"22260","DOI":"10.1109\/ACCESS.2022.3149482","volume":"10","author":"R Obiedat","year":"2022","unstructured":"Obiedat R, Qaddoura R, Al-Zoubi AM, Al-Qaisi L, Harfoushi O, Alrefai M, Faris H. Sentiment analysis of customers\u2019 reviews using a hybrid evolutionary SVM-Based approach in an imbalanced data distribution. IEEE Access. 2022;10:22260\u201373.","journal-title":"IEEE Access"},{"issue":"4","key":"1186_CR82","doi-asserted-by":"publisher","first-page":"461","DOI":"10.1108\/DTA-09-2020-0200","volume":"55","author":"S Osorio Angel","year":"2021","unstructured":"Osorio Angel S, Pe\u00f1a P\u00e9rez Negr\u00f3n A, Espinoza-Valdez A. Systematic literature review of sentiment analysis in the Spanish Language. Data Technol Appl. 2021;55(4):461\u201379. https:\/\/doi.org\/10.1108\/DTA-09-2020-0200.","journal-title":"Data Technol Appl"},{"key":"1186_CR83","doi-asserted-by":"crossref","unstructured":"Pang B, Lee L. (2004). A sentimental education: Sentiment analysis using subjectivity summarization based on minimum cuts. 
Proceedings of the 42nd annual meeting on Association for Computational Linguistics.","DOI":"10.3115\/1218955.1218990"},{"issue":"1","key":"1186_CR84","doi-asserted-by":"publisher","first-page":"17","DOI":"10.1016\/j.ijforecast.2017.08.002","volume":"34","author":"T Peeters","year":"2018","unstructured":"Peeters T. Testing the wisdom of crowds in the field: transfermarkt valuations and international soccer results. Int J Forecast. 2018;34(1):17\u201329. https:\/\/doi.org\/10.1016\/j.ijforecast.2017.08.002.","journal-title":"Int J Forecast"},{"key":"1186_CR85","doi-asserted-by":"publisher","first-page":"110551","DOI":"10.1016\/j.knosys.2023.110551","volume":"272","author":"N Ratner","year":"2023","unstructured":"Ratner N, Kagan E, Kumar P, Ben-Gal I. Unsupervised classification for uncertain varying responses: the wisdom-in-the-crowd (WICRO) algorithm. Knowl Based Syst. 2023;272:110551.","journal-title":"Knowl Based Syst"},{"key":"1186_CR86","doi-asserted-by":"publisher","first-page":"102874","DOI":"10.1016\/j.ijhm.2021.102874","volume":"94","author":"J Ren","year":"2021","unstructured":"Ren J, Raghupathi V, Raghupathi W. Effect of crowd wisdom on pricing in the asset-based sharing platform: an attribute substitution perspective. Int J Hospitality Manage. 2021;94:102874. https:\/\/doi.org\/10.1016\/j.ijhm.2021.102874.","journal-title":"Int J Hospitality Manage"},{"key":"1186_CR87","unstructured":"Sauri R. (2008). A Factuality Profiler for Eventualities in Text [Brandeis University]. Waltham, MA."},{"issue":"1","key":"1186_CR88","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1086\/658070","volume":"38","author":"JP Simmons","year":"2011","unstructured":"Simmons JP, Nelson LD, Galak J, Frederick S. Intuitive biases in choice versus estimation: implications for the wisdom of crowds. J Consum Res. 2011;38(1):1\u201315.","journal-title":"J Consum Res"},{"key":"1186_CR89","unstructured":"Skalak DB. (1996). 
The Sources of Increased Accuracy for Two Proposed Boosting Algorithms. AAAI Conference on Artificial Intelligence, Portland (OR)."},{"key":"1186_CR90","volume-title":"Combining Lexicon-and Learning-based approaches for improved performance and convenience in sentiment classification","author":"F Sommar","year":"2015","unstructured":"Sommar F, Wielondek M. Combining Lexicon-and Learning-based approaches for improved performance and convenience in sentiment classification. In. Stockholm, Sweden: CSC, KTH; 2015."},{"key":"1186_CR91","unstructured":"Stone PJ, Dunphy DC, Smith MS. The general inquirer: A computer approach to content analysis. M.I.T.; 1966."},{"key":"1186_CR92","unstructured":"Surowiecki J. The wisdom of crowds. Anchor Books; 2005."},{"issue":"2","key":"1186_CR93","doi-asserted-by":"publisher","first-page":"267","DOI":"10.1162\/COLI_a_00049","volume":"37","author":"M Taboada","year":"2011","unstructured":"Taboada M, Brooke J, Tofiloski M, Voll K, Stede M. Lexicon-Based methods for sentiment analysis. Comput Linguistics. 2011;37(2):267\u2013307.","journal-title":"Comput Linguistics"},{"key":"1186_CR94","doi-asserted-by":"crossref","unstructured":"Tan S, Wang Y, Cheng X. (2008). Combining learn-based and lexicon-based techniques for sentiment detection without using labeled examples. Proceedings of the 31st annual international ACM SIGIR conference on Research and development in information retrieval.","DOI":"10.1145\/1390334.1390481"},{"issue":"6","key":"1186_CR95","doi-asserted-by":"publisher","first-page":"823","DOI":"10.1177\/0165551510388123","volume":"36","author":"TT Thet","year":"2010","unstructured":"Thet TT, Na J-C, Khoo CSG. Aspect-based sentiment analysis of movie reviews on discussion boards. J Inform Sci. 
2010;36(6):823\u201348.","journal-title":"J Inform Sci"},{"issue":"13","key":"1186_CR96","doi-asserted-by":"publisher","first-page":"2760","DOI":"10.3390\/app9132760","volume":"9","author":"TK Tran","year":"2019","unstructured":"Tran TK, Phan TT. Deep learning application to ensemble learning\u2014The simple, but effective, approach to sentiment classifying. Appl Sci. 2019;9(13):2760.","journal-title":"Appl Sci"},{"key":"1186_CR97","doi-asserted-by":"crossref","unstructured":"Turney PD. (2002). Thumbs up or thumbs down? Semantic orientation applied to unsupervised classification of reviews. 40th Annual Meeting on Association for Computational Linguistics, Stroudsburg, PA.","DOI":"10.3115\/1073083.1073153"},{"issue":"1","key":"1186_CR98","doi-asserted-by":"publisher","first-page":"88","DOI":"10.1177\/10944281221124947","volume":"27","author":"L Valtonen","year":"2024","unstructured":"Valtonen L, M\u00e4kinen SJ, Kirjavainen J. Advancing reproducibility and accountability of unsupervised machine learning in text mining: importance of transparency in reporting preprocessing and algorithm selection. Organizational Res Methods. 2024;27(1):88\u2013113.","journal-title":"Organizational Res Methods"},{"issue":"3","key":"1186_CR99","doi-asserted-by":"publisher","first-page":"75","DOI":"10.1007\/s10462-024-10988-9","volume":"58","author":"Z Wang","year":"2025","unstructured":"Wang Z, Huang D, Cui J, Zhang X, Ho S-B, Cambria E. A review of Chinese sentiment analysis: subjects, methods, and trends. Artif Intell Rev. 2025;58(3):75. https:\/\/doi.org\/10.1007\/s10462-024-10988-9.","journal-title":"Artif Intell Rev"},{"key":"1186_CR100","unstructured":"Wertz J. (2018). Why Sentiment Analysis Could Be Your Best Kept Marketing Secret. 
Retrieved 07\/14\/2021, from https:\/\/www.forbes.com\/sites\/jiawertz\/2018\/11\/30\/why-sentiment-analysis-could-be-your-best-kept-marketing-secret\/?sh=6bfa2a352bbe"},{"issue":"2","key":"1186_CR101","doi-asserted-by":"publisher","first-page":"165","DOI":"10.1007\/s10579-005-7880-9","volume":"39","author":"J Wiebe","year":"2005","unstructured":"Wiebe J, Wilson T, Cardie C. Annotating expressions of opinions and emotions in Language. Lang Resour Evaluation. 2005;39(2):165\u2013210.","journal-title":"Lang Resour Evaluation"},{"key":"1186_CR102","doi-asserted-by":"crossref","unstructured":"Wilcoxon F. Individual comparisons by ranking methods. Breakthroughs in statistics: methodology and distribution. Springer; 1992. pp. 196\u2013202.","DOI":"10.1007\/978-1-4612-4380-9_16"},{"issue":"3","key":"1186_CR103","doi-asserted-by":"publisher","first-page":"839","DOI":"10.1007\/s10579-018-9416-0","volume":"52","author":"L Wu","year":"2018","unstructured":"Wu L, Morstatter F, Liu H. SlangSD: building, expanding and using a sentiment dictionary of slang words for short-text sentiment classification. Lang Resour Evaluation. 2018;52(3):839\u201352.","journal-title":"Lang Resour Evaluation"},{"issue":"3","key":"1186_CR104","doi-asserted-by":"publisher","first-page":"452","DOI":"10.1111\/j.1551-6709.2011.01223.x","volume":"36","author":"SKM Yi","year":"2012","unstructured":"Yi SKM, Steyvers M, Lee MD, Dry MJ. The wisdom of the crowd in combinatorial problems. Cogn Sci. 2012;36(3):452\u201370.","journal-title":"Cogn Sci"},{"issue":"252\u2013261","key":"1186_CR105","first-page":"257","volume":"194","author":"GU Yule","year":"1900","unstructured":"Yule GU, Pearson K. VII. On the association of attributes in statistics: with illustrations from the material of the childhood society, &c. Philosophical Trans Royal Soc Lond Ser Containing Papers Math or Phys Character. 
1900;194(252\u2013261):257\u2013319.","journal-title":"Philosophical Trans Royal Soc Lond Ser Containing Papers Math or Phys Character"},{"issue":"1","key":"1186_CR106","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1186\/s40537-023-00710-x","volume":"10","author":"H Zou","year":"2023","unstructured":"Zou H, Wang Z. A semi-supervised short text sentiment classification method based on improved Bert model from unlabelled data. J Big Data. 2023;10(1):35. https:\/\/doi.org\/10.1186\/s40537-023-00710-x.","journal-title":"J Big Data"}],"container-title":["Journal of Big Data"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-025-01186-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1186\/s40537-025-01186-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1186\/s40537-025-01186-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,5,23]],"date-time":"2025-05-23T19:03:27Z","timestamp":1748027007000},"score":1,"resource":{"primary":{"URL":"https:\/\/journalofbigdata.springeropen.com\/articles\/10.1186\/s40537-025-01186-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,23]]},"references-count":106,"journal-issue":{"issue":"1","published-online":{"date-parts":[[2025,12]]}},"alternative-id":["1186"],"URL":"https:\/\/doi.org\/10.1186\/s40537-025-01186-7","relation":{"references":[{"id-type":"doi","id":"10.2307\/41703503","asserted-by":"subject"}]},"ISSN":["2196-1115"],"issn-type":[{"value":"2196-1115","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,5,23]]},"assertion":[{"value":"22 October 
2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"12 May 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"23 May 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"Not applicable.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethics approval and consent to participate"}},{"value":"Not applicable.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Consent for publication"}},{"value":"The authors declare no competing interests.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Competing interests"}}],"article-number":"129"}}