{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,7,24]],"date-time":"2025-07-24T11:32:21Z","timestamp":1753356741966,"version":"3.37.3"},"reference-count":31,"publisher":"Oxford University Press (OUP)","issue":"2","license":[{"start":{"date-parts":[[2024,4,3]],"date-time":"2024-04-03T00:00:00Z","timestamp":1712102400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/academic.oup.com\/pages\/standard-publication-reuse-rights"}],"funder":[{"DOI":"10.13039\/501100012325","name":"National Social Science Fund of China","doi-asserted-by":"publisher","award":["20&ZD140","19ZDA317","20AZD130","18BYY235"],"award-info":[{"award-number":["20&ZD140","19ZDA317","20AZD130","18BYY235"]}],"id":[{"id":"10.13039\/501100012325","id-type":"DOI","asserted-by":"publisher"}]},{"name":"MOE Project of Key Research Institute of Humanities and Social Sciences"},{"name":"Universities in China","award":["22JJD740018"],"award-info":[{"award-number":["22JJD740018"]}]},{"name":"Philosophy and Social Science Foundation of Henan Province","award":["2021BYY024"],"award-info":[{"award-number":["2021BYY024"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,6,1]]},"abstract":"<jats:title>Abstract<\/jats:title>\n               <jats:p>Since the Internet is a breeding ground for unconfirmed fake news, its automatic detection and clustering studies have become crucial. Most current studies focus on English texts, and the common features of multilingual fake news are not sufficiently studied. Therefore, this article uses English, Russian, and Chinese as examples and focuses on identifying the common quantitative features of fake news in different languages at the word, sentence, readability, and sentiment levels. These features are then utilized in principal component analysis, K-means clustering, hierarchical clustering, and two-step clustering experiments, which achieved satisfactory results. The common features we proposed play a greater role in achieving automatic cross-lingual clustering than the features proposed in previous studies. Simultaneously, we discovered a trend toward linguistic simplification and economy in fake news. Furthermore, fake news is easier to understand and uses negative emotional expressions in ways that real news does not. Our research provides new reference features for fake news detection tasks and facilitates research into their linguistic characteristics.<\/jats:p>","DOI":"10.1093\/llc\/fqae016","type":"journal-article","created":{"date-parts":[[2024,4,3]],"date-time":"2024-04-03T10:25:53Z","timestamp":1712139953000},"page":"790-804","source":"Crossref","is-referenced-by-count":2,"title":["Finding common features in multilingual fake news: a quantitative clustering approach"],"prefix":"10.1093","volume":"39","author":[{"ORCID":"https:\/\/orcid.org\/0009-0004-2498-9447","authenticated-orcid":false,"given":"Wei","family":"Yuan","sequence":"first","affiliation":[{"name":"School of International Relations, National University of Defense Technology , Nanjing, 210039, China"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1724-4418","authenticated-orcid":false,"given":"Haitao","family":"Liu","sequence":"additional","affiliation":[{"name":"Institute of Quantitative Linguistics, Beijing Language and Culture University , Beijing, 100083, China"},{"name":"Center for Linguistics and Applied Linguistics, Guangdong University of Foreign Studies , Guangzhou, 510420, China"},{"name":"Department of Linguistics, Zhejiang University , Hangzhou, 310058, China"}]}],"member":"286","published-online":{"date-parts":[[2024,4,3]]},"reference":[{"key":"2024061809544990400_fqae016-B1","doi-asserted-by":"crossref","first-page":"87","DOI":"10.3390\/fi12050087","article-title":"Language-Independent Fake News Detection: English, Portuguese, and Spanish Mutual Features","volume":"12","author":"Abonizio","year":"2020","journal-title":"Future Internet"},{"key":"2024061809544990400_fqae016-B2","doi-asserted-by":"crossref","first-page":"211","DOI":"10.1257\/jep.31.2.211","article-title":"Social Media and Fake News in the 2016 Election","volume":"31","author":"Allcott","year":"2017","journal-title":"Journal of Economic Perspectives"},{"key":"2024061809544990400_fqae016-B3","doi-asserted-by":"crossref","first-page":"91","DOI":"10.1007\/3-540-44853-5_7","volume-title":"Proceedings of the 1st NSF\/NIJ Conference on Intelligence and Security Informatics","author":"Burgoon","year":"2003"},{"first-page":"208","year":"2017","author":"Buntain","key":"2024061809544990400_fqae016-B4"},{"first-page":"418","year":"2019","author":"Choshen","key":"2024061809544990400_fqae016-B5"},{"first-page":"310","year":"2021","author":"Dementieva","key":"2024061809544990400_fqae016-B6"},{"key":"2024061809544990400_fqae016-B7","doi-asserted-by":"crossref","first-page":"113503","DOI":"10.1016\/j.eswa.2020.113503","article-title":"Fake News Detection in Multiple Platforms and Languages","volume":"158","author":"Faustini","year":"2020","journal-title":"Expert Systems with Applications"},{"first-page":"171","year":"2012","author":"Feng","key":"2024061809544990400_fqae016-B8"},{"key":"2024061809544990400_fqae016-B9","doi-asserted-by":"crossref","first-page":"108432","DOI":"10.1016\/j.cie.2022.108432","article-title":"Linguistic Features Based Framework for Automatic Fake News Detection","volume":"172","author":"Garg","year":"2022","journal-title":"Computers and Industrial Engineering"},{"key":"2024061809544990400_fqae016-B10","doi-asserted-by":"crossref","first-page":"84","DOI":"10.22329\/il.v38i1.5068","article-title":"Fake News: A Definition","volume":"38","author":"Gelfert","year":"2018","journal-title":"Informal Log"},{"key":"2024061809544990400_fqae016-B11","doi-asserted-by":"crossref","first-page":"99","DOI":"10.1093\/llc\/fqac049","article-title":"Enriching Contextualized Semantic Representation with Textual Information Transmission for COVID-19 Fake News Detection: A Study on English and Persian","volume":"38","author":"Ghayoomi","year":"2022","journal-title":"Digital Scholarship in the Humanities"},{"key":"2024061809544990400_fqae016-B12","doi-asserted-by":"crossref","first-page":"10453","DOI":"10.1007\/s13369-021-06449-y","article-title":"Arabic Fake News Detection Based on Textual Analysis","volume":"47","author":"Himdi","year":"2022","journal-title":"Arabian Journal for Science and Engineering"},{"first-page":"759","year":"2017","author":"Horne","key":"2024061809544990400_fqae016-B13"},{"key":"2024061809544990400_fqae016-B14","doi-asserted-by":"crossref","first-page":"891","DOI":"10.1080\/17512786.2016.1163237","article-title":"Fake News: The Narrative Battle Over the Ukrainian Conflict","volume":"10","author":"Khaldarova","year":"2020","journal-title":"Journalism Practice"},{"first-page":"45","year":"2020","author":"Kuzmin","key":"2024061809544990400_fqae016-B15"},{"key":"2024061809544990400_fqae016-B16","doi-asserted-by":"crossref","first-page":"159","DOI":"10.17791\/jcs.2008.9.2.159","article-title":"Dependency Distance as a Metric of Language Comprehension Difficulty","volume":"9","author":"Liu","year":"2008","journal-title":"Journal of Cognitive Science"},{"key":"2024061809544990400_fqae016-B17","doi-asserted-by":"crossref","first-page":"123","DOI":"10.1080\/09296174.2014.882191","article-title":"Word Length Distribution in Mongolian","volume":"21","author":"Narisong","year":"2014","journal-title":"Journal of Quantitative Lingus"},{"issue":"6","key":"2024061809544990400_fqae016-B31","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3132039","article-title":"Surveying stylometry techniques and applications","volume":"50","author":"Neal","year":"2017","journal-title":"ACM Computing Surveys"},{"first-page":"3391","year":"2018","author":"P\u00e9rez-Rosas","key":"2024061809544990400_fqae016-B18"},{"key":"2024061809544990400_fqae016-B19","doi-asserted-by":"crossref","first-page":"490","DOI":"10.1609\/aaai.v34i01.5386","article-title":"Capturing the Style of Fake News","volume":"34","author":"Przybyla","year":"2020","journal-title":"Proceedings of the AAAI Conference on Artificial Intelligence"},{"first-page":"2931","year":"2017","author":"Rashkin","key":"2024061809544990400_fqae016-B20"},{"first-page":"755","year":"2018","author":"Rogers","key":"2024061809544990400_fqae016-B21"},{"key":"2024061809544990400_fqae016-B22","doi-asserted-by":"crossref","first-page":"379","DOI":"10.1093\/llc\/fqac023","article-title":"Multichannel Convolutional Neural Networks for Detecting COVID-19 Fake News","volume":"38","author":"Samadi","year":"2022","journal-title":"Digital Scholarship in the Humanities"},{"key":"2024061809544990400_fqae016-B23","doi-asserted-by":"crossref","first-page":"22","DOI":"10.1145\/3137597.3137600","article-title":"Fake news detection on social media: A data mining perspective","volume":"19","author":"Shu","year":"2017","journal-title":"ACM SIGKDD Exploration Newsletters"},{"key":"2024061809544990400_fqae016-B24","doi-asserted-by":"crossref","first-page":"132","DOI":"10.1007\/978-3-030-04497-8_11","volume-title":"Advances in Computational Intelligence: Vol. 11289","author":"Solnyshkina","year":"2018"},{"first-page":"3035","year":"2018","author":"Song","key":"2024061809544990400_fqae016-B25"},{"key":"2024061809544990400_fqae016-B27","doi-asserted-by":"crossref","first-page":"1146","DOI":"10.1126\/science.aap9559","article-title":"The Spread of True and False News Online","volume":"359","author":"Vosoughi","year":"2018","journal-title":"Science"},{"key":"2024061809544990400_fqae016-B28","first-page":"28","article-title":"Readability of Chinese Annual Reports: A Measure and Test","volume":"7","author":"Xu","year":"2021","journal-title":"China Journal of Accounting Studies"},{"key":"2024061809544990400_fqae016-B29","first-page":"363","article-title":"On Sentence-Length as a Statistical Characteristic of Style in Prose: With Application to Two Cases of Disputed Authorship","volume":"30","author":"Yule","year":"1939","journal-title":"Biometrika"},{"first-page":"2120","year":"2022","author":"Zhu","key":"2024061809544990400_fqae016-B32"},{"key":"2024061809544990400_fqae016-B30","doi-asserted-by":"crossref","first-page":"81","DOI":"10.1023\/B:GRUP.0000011944.62889.6f","article-title":"Automating Linguistics-Based Cues for Detecting Deception in Text-Based Asynchronous Computer-Mediated Communications","volume":"13","author":"Zhou","year":"2004","journal-title":"Group Decision and Negotiation"}],"container-title":["Digital Scholarship in the Humanities"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/academic.oup.com\/dsh\/article-pdf\/39\/2\/790\/58267418\/fqae016.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"syndication"},{"URL":"https:\/\/academic.oup.com\/dsh\/article-pdf\/39\/2\/790\/58267418\/fqae016.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,6,18]],"date-time":"2024-06-18T10:56:21Z","timestamp":1718708181000},"score":1,"resource":{"primary":{"URL":"https:\/\/academic.oup.com\/dsh\/article\/39\/2\/790\/7639473"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,4,3]]},"references-count":31,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2024,4,3]]},"published-print":{"date-parts":[[2024,6,1]]}},"URL":"https:\/\/doi.org\/10.1093\/llc\/fqae016","relation":{},"ISSN":["2055-7671","2055-768X"],"issn-type":[{"type":"print","value":"2055-7671"},{"type":"electronic","value":"2055-768X"}],"subject":[],"published-other":{"date-parts":[[2024,6]]},"published":{"date-parts":[[2024,4,3]]}}}