{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,26]],"date-time":"2026-03-26T07:41:00Z","timestamp":1774510860724,"version":"3.50.1"},"reference-count":35,"publisher":"Springer Science and Business Media LLC","issue":"1","license":[{"start":{"date-parts":[[2022,11,8]],"date-time":"2022-11-08T00:00:00Z","timestamp":1667865600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,11,8]],"date-time":"2022-11-08T00:00:00Z","timestamp":1667865600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Iran J Comput Sci"],"published-print":{"date-parts":[[2023,3]]},"DOI":"10.1007\/s42044-022-00124-7","type":"journal-article","created":{"date-parts":[[2022,11,8]],"date-time":"2022-11-08T19:04:33Z","timestamp":1667934273000},"page":"81-94","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["Semantic similarity measure for topic modeling using latent Dirichlet allocation and collapsed Gibbs sampling"],"prefix":"10.1007","volume":"6","author":[{"given":"Micheal Olalekan","family":"Ajinaja","sequence":"first","affiliation":[]},{"given":"Adebayo Olusola","family":"Adetunmbi","sequence":"additional","affiliation":[]},{"given":"Chukwuemeka Christian","family":"Ugwu","sequence":"additional","affiliation":[]},{"given":"Olugbemiga Solomon","family":"Popoola","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,11,8]]},"reference":[{"issue":"6","key":"124_CR1","doi-asserted-by":"publisher","first-page":"391","DOI":"10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9","volume":"41","author":"S Deerwester","year":"1990","unstructured":"Deerwester, S., Dumais, S.T., Furnas, G.W., Landauer, T.K., Harshman, R.: Indexing by latent semantic analysis. J. Am. Soc. Inf. Sci. 41(6), 391 (1990)","journal-title":"J. Am. Soc. Inf. Sci."},{"key":"124_CR2","doi-asserted-by":"publisher","first-page":"101582","DOI":"10.1016\/j.is.2020.101582","volume":"94","author":"I Vayansky","year":"2020","unstructured":"Vayansky, I., Kumar, S.A.P.: A review of topic modeling methods. Inform. Syst. 94, 101582 (2020). https:\/\/doi.org\/10.1016\/j.is.2020.101582","journal-title":"Inform. Syst."},{"issue":"3","key":"124_CR3","doi-asserted-by":"publisher","first-page":"1427","DOI":"10.1109\/TKDE.2020.2992485","volume":"34","author":"J Qiang","year":"2022","unstructured":"Qiang, J., Qian, Z., Li, Y., Yuan, Y., Wu, X.: Short text topic modeling techniques, applications, and performance: a survey. IEEE Trans Knowl Data Eng 34(3), 1427\u20131445 (2022). https:\/\/doi.org\/10.1109\/TKDE.2020.2992485","journal-title":"IEEE Trans Knowl Data Eng"},{"key":"124_CR4","doi-asserted-by":"publisher","first-page":"338","DOI":"10.1007\/978-3-642-20161-5_34","volume-title":"Advances in information retrieval","author":"WX Zhao","year":"2011","unstructured":"Zhao, W.X., Jiang, J., Weng, J., He, J., Lim, E.-P., Yan, H., Li, X.: Comparing Twitter and traditional media using topic models. In: Advances in information retrieval, pp. 338\u2013349. Springer (2011)"},{"key":"124_CR5","doi-asserted-by":"crossref","unstructured":"Ramage, D., Dumais, S., Liebling, D.: Characterizing microblogs with topic models, In: Fourth International AAAI Conference on Weblogs and social media (2010)","DOI":"10.1609\/icwsm.v4i1.14026"},{"key":"124_CR6","doi-asserted-by":"crossref","unstructured":"Dai, Z., Sun, A., Liu, X.-Y.: Crest: cluster-based representation enrichment for short text classification. In: Pacific\u2013Asia Conference on Knowledge Discovery and Data Mining, Springer, pp 256\u2013267 (2013)","DOI":"10.1007\/978-3-642-37456-2_22"},{"key":"124_CR7","doi-asserted-by":"crossref","unstructured":"Razavi, A. H., Inkpen, D.: Text representation using multi-level latent dirichlet allocation. In: Canadian Conference on Artificial Intelligence, Springer, pp 215\u2013226 (2014)","DOI":"10.1007\/978-3-319-06483-3_19"},{"key":"124_CR8","doi-asserted-by":"crossref","unstructured":"Lin, C. X., Zhao, B., Mei, Q., Han, J.: Pet: a statistical model for popular events tracking in social communities. In: Proceedings of the 16th ACM SIGKDD international conference on Knowledge discovery and data mining, ACM, pp 929\u2013938 (2010)","DOI":"10.1145\/1835804.1835922"},{"key":"124_CR9","doi-asserted-by":"crossref","unstructured":"Aggarwal, C.C., Subbian, K.: Event detection in social streams. In: Proceedings of the 2012 SIAM international conference on data mining, SIAM, pp. 624\u2013635 (2012)","DOI":"10.1137\/1.9781611972825.54"},{"key":"124_CR10","doi-asserted-by":"crossref","unstructured":"Ritter, A., Etzioni, O., Clark, S., et al.: Open domain event extraction from twitter. In: Proceedings of the 18th ACM SIGKDD international conference on Knowledge discovery and data mining, ACM, pp 1104\u20131112 (2012)","DOI":"10.1145\/2339530.2339704"},{"key":"124_CR11","doi-asserted-by":"crossref","unstructured":"Yin, H., Hu, Z., Zhou, X., Hao, W., Kai, Z., Nguyen, Q.V.H., Sadiq, S.: Discovering interpretable geo-social communities for user behavior prediction. In: 2016 IEEE 32nd International Conference on Data Engineering (ICDE) (2016)","DOI":"10.1109\/ICDE.2016.7498303"},{"key":"124_CR12","doi-asserted-by":"publisher","unstructured":"Goyal, A., Kashyap, I.: Latent Dirichlet Allocation\u2013An approach for topic discovery. In: 2022 International Conference on Machine Learning, Big Data, Cloud and Parallel Computing (COM-IT-CON), pp. 97\u2013102 (2022). https:\/\/doi.org\/10.1109\/COM-IT-CON54601.2022.9850912","DOI":"10.1109\/COM-IT-CON54601.2022.9850912"},{"key":"124_CR13","doi-asserted-by":"publisher","unstructured":"Barde, B. V., Bainwad, A. M.: An overview of topic modeling methods and tools. In: 2017 International Conference on Intelligent Computing and Control Systems (ICICCS), pp 745\u2013750 (2017) https:\/\/doi.org\/10.1109\/ICCONS.2017.8250563","DOI":"10.1109\/ICCONS.2017.8250563"},{"key":"124_CR14","doi-asserted-by":"publisher","unstructured":"Qin, D., Zheng, G., Liu, L., Li, L., Wang, Y., Zhao, L.: A knowledge search algorithm based on multidimensional semantic similarity analysis in knowledge graph systems of power grid networks. In: 2020 IEEE 20th International Conference on Communication Technology (ICCT), pp. 1447\u20131451 (2020) https:\/\/doi.org\/10.1109\/ICCT50939.2020.9295697","DOI":"10.1109\/ICCT50939.2020.9295697"},{"key":"124_CR15","first-page":"93","volume":"12","author":"Y Jiao","year":"2019","unstructured":"Jiao, Y., Jing, Ma., Kang, F.: Computing text semantic similarity with syntactic network of co-occurrence distance. Data Anal. Knowl. Discov. 12, 93\u2013100 (2019)","journal-title":"Data Anal. Knowl. Discov."},{"key":"124_CR16","doi-asserted-by":"publisher","unstructured":"Sheng, Q., Ying, G.: Measuring semantic similarity in ontology and its application in information retrieval. In: 2008 Congress on Image and Signal Processing, pp. 525\u2013529 (2008) https:\/\/doi.org\/10.1109\/CISP.2008.596","DOI":"10.1109\/CISP.2008.596"},{"key":"124_CR17","unstructured":"Newsgroup Master dataset. Retrieved from https:\/\/raw.githubusercontent.com\/selva86\/datasets\/master\/newsgroups.json"},{"key":"124_CR18","unstructured":"Hamed, J., Yongli, W., Chi, Y., Xia, F., Xiahui, J., Yanchao, L., Liang, Z.: Latent Dirichlet Allocation (LDA) and Topic modeling: models, applications, a survey. ArXiv.org e-print archive. (n.d.). https:\/\/arxiv.org\/ftp\/arxiv\/papers\/1310\/1310.8059.pdf. Retrieved 7 Aug 2022"},{"key":"124_CR19","doi-asserted-by":"publisher","DOI":"10.4108\/eai.13-7-2018.159623","author":"P Kherwa","year":"2019","unstructured":"Kherwa, P., Bansal, P.: Topic modelling: a comprehensive review. J. EAI Endorsed Trans. Scalable Inform. Syst. (2019). https:\/\/doi.org\/10.4108\/eai.13-7-2018.159623","journal-title":"J. EAI Endorsed Trans. Scalable Inform. Syst."},{"issue":"1","key":"124_CR20","doi-asserted-by":"publisher","first-page":"223","DOI":"10.4314\/njt.v38i1.27","volume":"38","author":"MA Adegoke","year":"2019","unstructured":"Adegoke, M.A., Ayeni, J.O., Adewole, P.A.: Empirical prior latent Dirichlet allocation model. Niger. J. Technol. (NIJOTECH). 38(1), 223\u2013232 (2019)","journal-title":"Niger. J. Technol. (NIJOTECH)."},{"issue":"4","key":"124_CR21","doi-asserted-by":"publisher","first-page":"1356","DOI":"10.1016\/j.ipm.2019.04.003","volume":"56","author":"M Mohamed","year":"2019","unstructured":"Mohamed, M., Oussalah, M.: SRL-ESA-TextSum: a text summarization approach based on semantic role labeling and explicit semantic analysis. Inform. Process. Manag. 56(4), 1356\u20131372 (2019)","journal-title":"Inform. Process. Manag."},{"key":"124_CR22","doi-asserted-by":"publisher","unstructured":"Sainani, A. et al.: Extracting and classifying requirements from software engineering contracts. In: 2020 IEEE 28th International Requirements Engineering Conference (RE) (2020) [Preprint]. https:\/\/doi.org\/10.1109\/re48521.2020.00026","DOI":"10.1109\/re48521.2020.00026"},{"key":"124_CR23","unstructured":"Jonsson, E., Stolee, J.: An evaluation of topic modelling techniques for twitter. An evaluation of topic modelling techniques for Twitter. (n.d.). https:\/\/www.cs.toronto.edu\/jstolee\/projects\/topic.pdf. Retrieved 7 Aug 2022"},{"key":"124_CR24","doi-asserted-by":"publisher","first-page":"93","DOI":"10.1186\/s40537-019-0255-7","volume":"6","author":"CB Asmussen","year":"2019","unstructured":"Asmussen, C.B., M\u00f8ller, C.: Smart literature review: a practical topic modelling approach to exploratory literature review. J. Big Data 6, 93 (2019). https:\/\/doi.org\/10.1186\/s40537-019-0255-7","journal-title":"J. Big Data"},{"issue":"24","key":"124_CR25","first-page":"27581","volume":"9","author":"D Akila","year":"2014","unstructured":"Akila, D., Jayakumar, C.: Semantic similarity\u2014a review of approaches and metrics. Int. J. Appl. Eng. Res. 9(24), 27581\u201327600 (2014)","journal-title":"Int. J. Appl. Eng. Res."},{"key":"124_CR26","unstructured":"Sontag, D., Roy, D.M.: Complexity of inference in latent Dirichlet allocation. (2022). https:\/\/people.csail.mit.edu\/dsontag\/papers\/SontagRoy_nips11.pdf. Accessed: 31 Oct 2022"},{"key":"124_CR27","doi-asserted-by":"publisher","first-page":"207","DOI":"10.1016\/j.procs.2019.11.277","volume":"162","author":"JC Bail\u00f3n-Elvira","year":"2019","unstructured":"Bail\u00f3n-Elvira, J.C., Cobo, M.J., Herrera-Viedma, E., L\u00f3pez-Herrera, A.G.: Latent Dirichlet allocation (LDA) for improving the topic modeling of the official bulletin of the Spanish state (BOE). Procedia Comput. Sci. 162, 207\u2013214 (2019)","journal-title":"Procedia Comput. Sci."},{"key":"124_CR28","doi-asserted-by":"publisher","DOI":"10.3390\/ai2020011","volume-title":"Latent Dirichlet allocation and t-distributed stochastic neighbor embedding enhance scientific reading comprehension of articles related to enterprise architecture","author":"N Horn","year":"2021","unstructured":"Horn, N., Gampfer, F., Buchkremer, R.: Latent Dirichlet allocation and t-distributed stochastic neighbor embedding enhance scientific reading comprehension of articles related to enterprise architecture. Institute of IT Management and Digitization Research (IFID) (2021)"},{"key":"124_CR29","unstructured":"Anima A. et al.: A spectral algorithm for latent Dirichlet allocation. Retrieved from https:\/\/www.cs.columbia.edu\/~djhsu\/papers\/lda-nips.pdf"},{"key":"124_CR30","unstructured":"Lei, S., Griffiths, T.L., Kevin, R.C.: Online inference of topics with latent Dirichlet allocation. In: 2th International Conference on Artificial Intelligence and Statistics (AISTATS) vol. 5 (2009)"},{"key":"124_CR31","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1016\/j.neunet.2014.05.008","volume":"58","author":"A Gross","year":"2014","unstructured":"Gross, A., Murthy, D.: Modeling virtual organizations with latent Dirichlet allocation: a case for natural language processing. J. Neural Netw. 58, 38\u201349 (2014)","journal-title":"J. Neural Netw."},{"key":"124_CR32","unstructured":"\u0160peh, J., Muhic, J., Rupnik, J.: Parameter estimation for the Latent Dirichlet Allocation. Retrieved from https:\/\/ailab.ijs.si\/dunja\/SiKDD2013\/Papers\/Speh-ldaAlgorithms.pdf"},{"key":"124_CR33","unstructured":"Zhe, C., Dossaca, H.. Inference for the number of topics in the Latent Dirichlet allocation model via Bayesian mixture modelling. Retrieved from https:\/\/users.stat.ufl.edu\/~doss\/Research\/lda-ntopics.pdf"},{"key":"124_CR34","doi-asserted-by":"crossref","unstructured":"Foster, A., Li, H., Maierhofer, G., Shearer, M.: An extension of standard latent dirichlet allocation to multiple corpora. Retrieved on April 2016 from http:\/\/evoq-eval.siam.org\/Portals\/0\/Publications\/SIURO\/Vol9\/AN_EXTENSION_STANDARD_LATENT_DIRICHLET_ALLOCATION.pdf?ver=2018-04-06-152049-177","DOI":"10.1137\/15S014599"},{"key":"124_CR35","unstructured":"Hew, Z.J., Olanrewaju, V.J., Chew, X.Y., Khaw, K.W.: Text summarization for news articles by machine learning techniques. J. Appl. Math. Comput. Intell. (2022)"}],"container-title":["Iran Journal of Computer Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42044-022-00124-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s42044-022-00124-7\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42044-022-00124-7.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,2,16]],"date-time":"2023-02-16T17:19:20Z","timestamp":1676567960000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s42044-022-00124-7"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,11,8]]},"references-count":35,"journal-issue":{"issue":"1","published-print":{"date-parts":[[2023,3]]}},"alternative-id":["124"],"URL":"https:\/\/doi.org\/10.1007\/s42044-022-00124-7","relation":{},"ISSN":["2520-8438","2520-8446"],"issn-type":[{"value":"2520-8438","type":"print"},{"value":"2520-8446","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,11,8]]},"assertion":[{"value":"16 August 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"25 October 2022","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"8 November 2022","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors have no conflicts of interest to disclose about the article's content.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}