{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,4,2]],"date-time":"2025-04-02T04:02:10Z","timestamp":1743566530759,"version":"3.40.3"},"publisher-location":"Cham","reference-count":88,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031861925","type":"print"},{"value":"9783031861932","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-86193-2_4","type":"book-chapter","created":{"date-parts":[[2025,4,1]],"date-time":"2025-04-01T03:26:26Z","timestamp":1743477986000},"page":"44-73","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Applying Text Mining to\u00a0Analyze Human Question Asking in\u00a0Creativity Research"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3407-7570","authenticated-orcid":false,"given":"Anna","family":"Wr\u00f3blewska","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Marceli","family":"Korbin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3872-7689","authenticated-orcid":false,"given":"Yoed 
N.","family":"Kenett","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7251-7899","authenticated-orcid":false,"given":"Daniel","family":"Dan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7714-4844","authenticated-orcid":false,"given":"Maria","family":"Ganzha","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8069-2152","authenticated-orcid":false,"given":"Marcin","family":"Paprzycki","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,3,31]]},"reference":[{"key":"4_CR1","unstructured":"question, 2023, in dictionary.cambridge.org. https:\/\/dictionary.cambridge.org\/us\/dictionary\/english\/question. Accessed 8 Dec 2023"},{"key":"4_CR2","unstructured":"Different Types of Questions, Revolution Learning and Development. https:\/\/www.revolutionlearning.co.uk\/article\/different-types-of-questions\/. Accessed 9 Dec 2023"},{"key":"4_CR3","unstructured":"Miller, J.G.: 15 Reasons to Ask Questions, QBQ (2014). https:\/\/qbq.com\/15-reasons-to-ask-questions\/. Accessed 8 Dec 2023"},{"key":"4_CR4","unstructured":"Perel, E., Miller, M.A.: Letters from Esther #52: A Good Question Changes the Story, Esther Perel\u2019s Blog. https:\/\/www.estherperel.com\/blog\/letters-from-esther-52-a-good-question-changes-the-story. Accessed 26 Feb 2024"},{"issue":"1","key":"4_CR5","doi-asserted-by":"publisher","first-page":"26","DOI":"10.3390\/bdcc7010026","volume":"7","author":"G Sasson","year":"2023","unstructured":"Sasson, G., Kenett, Y.N.: A mirror to human question asking: analyzing the Akinator online question game. Big Data Cogn. Comput. 7(1), 26 (2023). https:\/\/doi.org\/10.3390\/bdcc7010026","journal-title":"Big Data Cogn. 
Comput."},{"key":"4_CR6","doi-asserted-by":"publisher","DOI":"10.1002\/jocb.671","author":"G Sasson","year":"2024","unstructured":"Sasson, G., Raz, T., Kenett, Y.N.: The art of creative inquiry-from question asking to prompt engineering. J. Creat. Behav. (2024). https:\/\/doi.org\/10.1002\/jocb.671","journal-title":"J. Creat. Behav."},{"key":"4_CR7","doi-asserted-by":"publisher","unstructured":"Raz, T., Reiter-Palmon, R., Kenett, Y.N.: The role of asking more complex questions in creative thinking, Psychol. Aesthetics, Creativity, Arts (2023). https:\/\/doi.org\/10.1037\/aca0000658","DOI":"10.1037\/aca0000658"},{"key":"4_CR8","unstructured":"Raz, T., Luchini, S., Beaty, R., Kenett, Y.: Bridging the measurement gap: a large language model method of assessing open-ended question complexity. In: Proceedings of the Annual Meeting of the Cognitive Science Society, vol. 46 (2024)"},{"key":"4_CR9","doi-asserted-by":"publisher","unstructured":"Acar, S.: Creativity assessment, research, and practice in the age of artificial intelligence, Creativity Res. J. (2023). https:\/\/doi.org\/10.1080\/10400419.2023.2271749","DOI":"10.1080\/10400419.2023.2271749"},{"key":"4_CR10","doi-asserted-by":"crossref","unstructured":"Mumford, M., Whetzel, D.L., Reiter-Palmon, R.: Thinking creatively at work: organization influences on creative problem solving, J. Creative Behav. 31(1), 7\u201317 (1997). https:\/\/onlinelibrary.wiley.com\/doi\/abs\/10.1002\/j.2162-6057.1997.tb00777.x","DOI":"10.1002\/j.2162-6057.1997.tb00777.x"},{"issue":"3","key":"4_CR11","doi-asserted-by":"crossref","first-page":"187","DOI":"10.1207\/s15326934crj1103_1","volume":"11","author":"R Reiter-Palmon","year":"1998","unstructured":"Reiter-Palmon, R., Mumford, M.D., Threlfall, K.V.: Solving everyday problems creatively: the role of problem construction and personality type. Creat. Res. J. 11(3), 187\u2013197 (1998)","journal-title":"Creat. Res. 
J."},{"key":"4_CR12","doi-asserted-by":"crossref","unstructured":"Tofade, T., Elsner, J., Haines, S.T.: Best practice strategies for effective use of questions as a teaching tool, Am. J. Pharm. Educ. 77(7) (2013). https:\/\/www.sciencedirect.com\/science\/article\/pii\/S0002945923029911","DOI":"10.5688\/ajpe777155"},{"key":"4_CR13","doi-asserted-by":"crossref","unstructured":"Adams, W.C.: Conducting semi-structured interviews, Handbook of practical program evaluation, pp.492\u2013505. Wiley Online Library (2015)","DOI":"10.1002\/9781119171386.ch19"},{"key":"4_CR14","doi-asserted-by":"publisher","first-page":"467","DOI":"10.1016\/j.sbspro.2012.09.302","volume":"59","author":"AM Daud","year":"2012","unstructured":"Daud, A.M., Omar, J., Turiman, P., Osman, K.: Creativity in science education. Procedia - Soc. Behav. Sci. 59, 467\u2013474 (2012). https:\/\/doi.org\/10.1016\/j.sbspro.2012.09.302","journal-title":"Procedia - Soc. Behav. Sci."},{"key":"4_CR15","doi-asserted-by":"crossref","unstructured":"Kenett, Y.N.: Assessing the role of associative abilities in creative thinking via behavioral, computational, and neuroscientific approaches, Handbook of Creativity Assessment, pp.182\u2013198. Edward Elgar Publishing (2024)","DOI":"10.4337\/9781839102158.00019"},{"key":"4_CR16","unstructured":"Anderson, L.W., Krathwohl, D.R., Bloom, B.S.: A taxonomy for learning, teaching, and assessing: a revision of bloom\u2019s taxonomy of educational objectives, Longman, New York (2000). isbn: 978-0-8013-1903-7"},{"key":"4_CR17","unstructured":"Rutka, J.: Bloom\u2019s Taxonomy Question Stems for Use in Assessment, Top Hat (2023). https:\/\/tophat.com\/blog\/blooms-taxonomy-question-stems. Accessed 9 Dec 2023"},{"key":"4_CR18","unstructured":"Bloom\u2019s Taxonomy. https:\/\/www.bloomstaxonomy.net. Accessed 9 Dec 2023"},{"key":"4_CR19","unstructured":"Trickey, S.: Bloom\u2019s Taxonomy, Teach With Mrs T (2020). https:\/\/www.teachwithmrst.com\/post\/bloom-s-taxonomy. 
Accessed 18 Dec 2023"},{"key":"4_CR20","volume-title":"Taxonomy of Educational Objectives: Handbook II: Affective Domain","author":"DR Krathwohl","year":"1964","unstructured":"Krathwohl, D.R., Bloom, B.S., Masia, B.B.: Taxonomy of Educational Objectives: Handbook II: Affective Domain. David McKay Co., New York (1964)"},{"key":"4_CR21","unstructured":"Simpson, E.J.: The Classification of Educational Objectives, Psychomotor Domain (1972)"},{"key":"4_CR22","unstructured":"Dr. Yoed Kenett - The brain is wired to adapt, survive, and evolve in complex environments. An interview with Y.N. Kenett, conducted by Sonophilia Foundation (2022). https:\/\/www.sonophiliafoundation.org\/dr-yoed-kenett-the-brain-is-wired-to-adapt-survive-and-evolve-in-complex-environments\/. Accessed 10 Dec 2023"},{"issue":"1","key":"4_CR23","doi-asserted-by":"crossref","first-page":"10","DOI":"10.1631\/FITEE.1700826","volume":"19","author":"H Shum","year":"2018","unstructured":"Shum, H., He, X., Li, D.: From Eliza to Xiaoice: challenges and opportunities with social chatbots. Front. Inf. Technol. Electron. Eng. 19(1), 10\u201326 (2018)","journal-title":"Front. Inf. Technol. Electron. Eng."},{"key":"4_CR24","doi-asserted-by":"crossref","unstructured":"Xu, Z., Howarth, A., Briggs, N., Cristianini, N.: What makes us curious? Analysis of a corpus of open-domain questions (2021). arXiv: 2110.15409. https:\/\/arxiv.org\/abs\/2110.15409","DOI":"10.5121\/csit.2021.112007"},{"key":"4_CR25","unstructured":"The story of Project What If, We the Curious. https:\/\/www.wethecurious.org\/projectwhatif. Accessed 14 Dec 2023"},{"key":"4_CR26","doi-asserted-by":"publisher","first-page":"35318","DOI":"10.1109\/ACCESS.2020.2974983","volume":"8","author":"D Buena\u00f1o-Fernandez","year":"2020","unstructured":"Buena\u00f1o-Fernandez, D., Gonz\u00e1lez, M., Gil, D., Luj\u00e1n-Mora, S.: Text mining of open-ended questions in self-assessment of university teachers: an LDA topic modeling approach. 
IEEE Access 8, 35318\u201335330 (2020). https:\/\/doi.org\/10.1109\/ACCESS.2020.2974983","journal-title":"IEEE Access"},{"key":"4_CR27","doi-asserted-by":"publisher","unstructured":"Gani, M.O., Ayyasamy, R.K., Sangodiah, A., Fui, Y.T.: Bloom\u2019s taxonomy-based exam question classification: the outcome of CNN and optimal pre-trained word embedding technique (2023). https:\/\/doi.org\/10.1007\/s10639-023-11842-1","DOI":"10.1007\/s10639-023-11842-1"},{"key":"4_CR28","unstructured":"Gani, M.O., Sangodiah, A.: Exam Question Datasets, Version 3 (2023). https:\/\/figshare.com\/articles\/dataset\/Exam_Question_Datasets\/22597957\/3"},{"key":"4_CR29","doi-asserted-by":"publisher","first-page":"587","DOI":"10.1016\/j.sbspro.2013.10.277","volume":"97","author":"AA Yahya","year":"2013","unstructured":"Yahya, A.A., Osman, A., Taleb, A., Alattab, A.A.: Analysing the cognitive level of classroom questions using machine learning techniques. Procedia. Soc. Behav. Sci. 97, 587\u2013595 (2013). https:\/\/doi.org\/10.1016\/j.sbspro.2013.10.277","journal-title":"Procedia. Soc. Behav. Sci."},{"issue":"4\u20132","key":"4_CR30","doi-asserted-by":"publisher","first-page":"1679","DOI":"10.18517\/ijaseit.8.4-2.6835","volume":"8","author":"M Mohammed","year":"2018","unstructured":"Mohammed, M., Omar, N.: Question classification based on bloom\u2019s taxonomy using enhanced TF-IDF international. J. Adv. Sci. Eng. Inf. Technol. 8(4\u20132), 1679\u20131685 (2018). https:\/\/doi.org\/10.18517\/ijaseit.8.4-2.6835","journal-title":"J. Adv. Sci. Eng. Inf. Technol."},{"issue":"3","key":"4_CR31","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1371\/journal.pone.0230442","volume":"15","author":"M Mohammed","year":"2020","unstructured":"Mohammed, M., Omar, N.: Question classification based on Bloom\u2019s taxonomy cognitive domain using modified TF-IDF and word2vec. PLoS ONE 15(3), 1\u201321 (2020). 
https:\/\/doi.org\/10.1371\/journal.pone.0230442","journal-title":"PLoS ONE"},{"issue":"2","key":"4_CR32","doi-asserted-by":"publisher","first-page":"1","DOI":"10.30935\/cedtech\/8341","volume":"12","author":"S Das","year":"2020","unstructured":"Das, S., Mandal, S.K.D., Basu, A.: Identification of cognitive learning complexity of assessment questions using multi-class text classification. Contemp. Educ. Technol. 12(2), 1\u201314 (2020). https:\/\/doi.org\/10.30935\/cedtech\/8341","journal-title":"Contemp. Educ. Technol."},{"key":"4_CR33","doi-asserted-by":"publisher","first-page":"117887","DOI":"10.1109\/ACCESS.2021.3106443","volume":"9","author":"S Shaikh","year":"2021","unstructured":"Shaikh, S., Daudpotta, S.M., Imran, A.S.: Bloom\u2019s learning outcomes\u2019 automatic classification using LSTM and pretrained word embeddings. IEEE Access 9, 117887\u2013117909 (2021). https:\/\/doi.org\/10.1109\/ACCESS.2021.3106443","journal-title":"IEEE Access"},{"issue":"5","key":"4_CR34","doi-asserted-by":"publisher","first-page":"5105","DOI":"10.1007\/s10639-022-11356-2","volume":"28","author":"H Sharma","year":"2022","unstructured":"Sharma, H., Mathur, R., Chintala, T., Dhanalakshmi, S., Senthil, R.: An effective deep learning pipeline for improved question classification into bloom\u2019s taxonomy\u2019s domains. Educ. Inf. Technol. 28(5), 5105\u20135145 (2022). https:\/\/doi.org\/10.1007\/s10639-022-11356-2","journal-title":"Educ. Inf. Technol."},{"issue":"1","key":"4_CR35","doi-asserted-by":"publisher","first-page":"121","DOI":"10.1007\/s40593-019-00186-y","volume":"30","author":"G Kurdi","year":"2019","unstructured":"Kurdi, G., Leo, J., Parsia, B., Sattler, U., Al-Emari, S.: A systematic review of automatic question generation for educational purposes. Int. J. Artif. Intell. Educ. 30(1), 121\u2013204 (2019). https:\/\/doi.org\/10.1007\/s40593-019-00186-y","journal-title":"Int. J. Artif. Intell. 
Educ."},{"issue":"2","key":"4_CR36","doi-asserted-by":"publisher","first-page":"94","DOI":"10.1080\/08832329709601623","volume":"73","author":"JD Hansen","year":"1997","unstructured":"Hansen, J.D., Dexter, L.: Quality multiple-choice test questions: item-writing guidelines and an analysis of auditing testbanks. J. Educ. Bus. 73(2), 94\u201397 (1997). https:\/\/doi.org\/10.1080\/08832329709601623","journal-title":"J. Educ. Bus."},{"issue":"6","key":"4_CR37","doi-asserted-by":"publisher","first-page":"354","DOI":"10.1016\/j.nepr.2006.07.002","volume":"6","author":"M Tarrant","year":"2006","unstructured":"Tarrant, M., Knierim, A., Hayes, S.K., Ware, J.: The frequency of item writing flaws in multiple-choice questions used in high stakes nursing assessments. Nurse Educ. Pract. 6(6), 354\u2013363 (2006). https:\/\/doi.org\/10.1016\/j.nepr.2006.07.002","journal-title":"Nurse Educ. Pract."},{"issue":"2","key":"4_CR38","first-page":"142","volume":"62","author":"MR Hingorjo","year":"2012","unstructured":"Hingorjo, M.R., Jaleel, F.: Analysis of one-best MCQs: the difficulty index, discrimination index and distractor efficiency. JPMA-J. Pakistan Med. Assoc. 62(2), 142 (2012)","journal-title":"JPMA-J. Pakistan Med. Assoc."},{"key":"4_CR39","doi-asserted-by":"publisher","first-page":"250","DOI":"10.1186\/s12909-016-0773-3","volume":"16","author":"BR Rush","year":"2016","unstructured":"Rush, B.R., Rankin, D.C., White, B.J.: The impact of item-writing flaws and item complexity on examination item difficulty and discrimination value. BMC Med. Educ. 16, 250 (2016). https:\/\/doi.org\/10.1186\/s12909-016-0773-3","journal-title":"BMC Med. Educ."},{"key":"4_CR40","doi-asserted-by":"publisher","unstructured":"McCarthy, P.M., Jarvis, S.: MTLD, vocd-D, and HD-D: a validation study of sophisticated approaches to lexical diversity assessment (2010). 
https:\/\/doi.org\/10.3758\/BRM.42.2.381","DOI":"10.3758\/BRM.42.2.381"},{"key":"4_CR41","doi-asserted-by":"crossref","first-page":"323","DOI":"10.1023\/A:1001749303137","volume":"32","author":"FJ Tweedie","year":"1998","unstructured":"Tweedie, F.J., Baayen, R.H.: How variable may a constant be? Measures of lexical richness in perspective. Comput. Humanit. 32, 323\u2013352 (1998)","journal-title":"Comput. Humanit."},{"key":"4_CR42","doi-asserted-by":"publisher","first-page":"372","DOI":"10.22363\/2618-897X-2018-15-3-372-380","volume":"15","author":"O Vinogradova","year":"2018","unstructured":"Vinogradova, O.: Automated vocabulary evaluation in a learner corpus. Polylinguality Transcult. Pract. 15, 372\u2013380 (2018). https:\/\/doi.org\/10.22363\/2618-897X-2018-15-3-372-380","journal-title":"Polylinguality Transcult. Pract."},{"key":"4_CR43","doi-asserted-by":"crossref","unstructured":"Templin, M.C.: Certain Language Skills in Children; Their Development and Interrelationships. University of Minnesota Press (1957)","DOI":"10.5749\/j.ctttv2st"},{"issue":"3","key":"4_CR44","doi-asserted-by":"publisher","first-page":"441","DOI":"10.1287\/mksc.2022.1354","volume":"41","author":"M Reisenbichler","year":"2022","unstructured":"Reisenbichler, M., Reutterer, T., Schweidel, D.A., Dan, D.: Frontiers: supporting content marketing with natural language generation. Mark. Sci. 41(3), 441\u2013452 (2022). https:\/\/doi.org\/10.1287\/mksc.2022.1354","journal-title":"Mark. Sci."},{"issue":"7","key":"4_CR45","doi-asserted-by":"publisher","first-page":"3726","DOI":"10.3758\/s13428-022-01986-2","volume":"55","author":"DR Johnson","year":"2022","unstructured":"Johnson, D.R., et al.: Divergent semantic integration (DSI): extracting creativity from narratives with distributional semantic modeling. Behav. Res. Methods 55(7), 3726\u20133759 (2022). https:\/\/doi.org\/10.3758\/s13428-022-01986-2","journal-title":"Behav. Res. 
Methods"},{"key":"4_CR46","doi-asserted-by":"publisher","unstructured":"Yu, Y., et al.: A MAD method to assess idea novelty: improving validity of automatic scoring using maximum associative distance (MAD), Psychol. Aesthetics, Creativity, Arts (2023). https:\/\/doi.org\/10.1037\/aca0000573","DOI":"10.1037\/aca0000573"},{"key":"4_CR47","doi-asserted-by":"publisher","unstructured":"Xia, M., Kochmar, E., Briscoe, T.: Text readability assessment for second language learners, In: Proceedings of the 11th Workshop on Innovative Use of NLP for Building Educational Applications, pp. 12\u201322. Association for Computational Linguistics, San Diego (2016). https:\/\/doi.org\/10.18653\/v1\/W16-0502","DOI":"10.18653\/v1\/W16-0502"},{"key":"4_CR48","unstructured":"Flesch, R.: How to Write Plain English: a Book for Lawyers and Consumers, University of Canterbury (1979)"},{"key":"4_CR49","doi-asserted-by":"crossref","unstructured":"Kincaid, J.P., et al.: Derivation of new readability formulas (Automated Readability Index, Fog Count and Flesch Reading Ease Formula) for Navy enlisted personnel, Research Branch Report 8\u201375, Millington, TN: Naval Technical Training, U. S. Naval Air Station, Memphis, TN (1975). https:\/\/apps.dtic.mil\/sti\/pdfs\/ADA006655.pdf","DOI":"10.21236\/ADA006655"},{"key":"4_CR50","unstructured":"Hussin, A.A.: Refining the Flesch Reading Ease Formula for Intermediate and High-Intermediate ESL Learners (2015)"},{"key":"4_CR51","unstructured":"Senter, R.J., Smith, E.A.: Automated Readability Index (1967)"},{"key":"4_CR52","unstructured":"What is Natural Language Processing?, Coursera (2023). https:\/\/www.coursera.org\/articles\/natural-language-processing. Accessed 16 Dec 2023"},{"key":"4_CR53","unstructured":"Mikolov, T., Chen, K., Corrado, G., Dean, J.: Efficient Estimation of Word Representations in Vector Space (2013). arXiv: 1301.3781. 
https:\/\/arxiv.org\/abs\/1301.3781"},{"key":"4_CR54","unstructured":"Peters, M.E., et al.: Deep contextualized word representations (2018). arXiv: 1802.05365. https:\/\/arxiv.org\/abs\/1802.05365"},{"key":"4_CR55","doi-asserted-by":"publisher","first-page":"1532","DOI":"10.3115\/v1\/D14-1162","volume":"D14\u20131162","author":"J Pennington","year":"2014","unstructured":"Pennington, J., Socher, R., Manning, C.: GloVe: global vectors for word representation. Assoc. Comput. Linguist. D14\u20131162, 1532\u20131543 (2014). https:\/\/doi.org\/10.3115\/v1\/D14-1162","journal-title":"Assoc. Comput. Linguist."},{"key":"4_CR56","unstructured":"Serrano, L.: What are word and sentence embeddings?, Cohere Blog (2023). https:\/\/txt.cohere.com\/sentence-word-embeddings\/. Accessed 17 Dec 2023"},{"key":"4_CR57","unstructured":"Vaswani, A., et al.: Attention is all you need (2017). arXiv: 1706.03762. https:\/\/arxiv.org\/abs\/1706.03762"},{"key":"4_CR58","unstructured":"Devlin, J., Chang, M.-W., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding (2018). arXiv: 1810.04805. https:\/\/arxiv.org\/abs\/1810.04805"},{"key":"4_CR59","unstructured":"Gundapu, S., Mamidi, R.: Transformer based automatic COVID-19 fake news detection system (2021). arXiv: 2101.00180. https:\/\/arxiv.org\/abs\/2101.00180"},{"key":"4_CR60","unstructured":"Zhuang, F., et al.: A comprehensive survey on transfer learning (2019). arXiv: 1911.02685. https:\/\/arxiv.org\/abs\/1911.02685"},{"key":"4_CR61","doi-asserted-by":"crossref","unstructured":"Reimers, N., Gurevych, I.: Sentence-BERT: sentence embeddings using siamese BERT-networks (2019). arXiv: 1908.10084. https:\/\/arxiv.org\/abs\/1908.10084","DOI":"10.18653\/v1\/D19-1410"},{"key":"4_CR62","unstructured":"SentenceTransformers Documentation. https:\/\/sbert.net\/index.html"},{"key":"4_CR63","unstructured":"Liu, Y., et al.: RoBERTa: a robustly optimized BERT pretraining approach (2019). arXiv: 1907.11692. 
https:\/\/arxiv.org\/abs\/1907.11692"},{"key":"4_CR64","unstructured":"Sanh, V., Debut, L., Chaumond, J., Wolf, T.: DistilBERT, a distilled version of BERT: smaller, faster, cheaper and lighter (2019). arXiv: 1910.01108. https:\/\/arxiv.org\/abs\/1910.01108"},{"key":"4_CR65","unstructured":"Wang, W., et al.: MiniLM: deep self-attention distillation for task-agnostic compression of pre-trained transformers (2020). arXiv: 2002.10957. https:\/\/arxiv.org\/abs\/2002.10957"},{"key":"4_CR66","unstructured":"Song, K., et al.: MPNet: masked and permuted pre-training for language understanding (2020). arXiv: 2004.09297v2. https:\/\/arxiv.org\/abs\/2004.09297v2"},{"key":"4_CR67","unstructured":"Yang, Z., et al.: XLnet: generalized autoregressive pretraining for language understanding (2019)"},{"key":"4_CR68","unstructured":"Radford, A., Narasimhan, K.: Improving language understanding by generative pre-training (2018)"},{"key":"4_CR69","unstructured":"Radford, A., Wu, J., Child, R., Luan, D., Amodei, D., Sutskever, I.: Language models are unsupervised multitask learners (2019)"},{"key":"4_CR70","unstructured":"Brown, T.B., et al.: Language models are few-shot learners (2020). arXiv: 2005.14165. https:\/\/arxiv.org\/abs\/2005.14165"},{"key":"4_CR71","unstructured":"OpenAI, GPT-4 Technical report (2023). arXiv: 2303.08774. https:\/\/arxiv.org\/abs\/2303.08774"},{"key":"4_CR72","unstructured":"Toews, R.: The Next Generation of Large Language Models, Forbes (2023). https:\/\/www.forbes.com\/sites\/robtoews\/2023\/02\/07\/the-next-generation-of-large-language-models. Accessed 18 Dec 2023"},{"key":"4_CR73","unstructured":"Newman, D.: Exploring the ins and outs of the generative AI boom, Forbes (2023). www.forbes.com\/sites\/danielnewman\/2023\/03\/14\/exploring-the-ins-and-outs-of-the-generative-ai-boom. Accessed 18 Dec 2023"},{"key":"4_CR74","doi-asserted-by":"crossref","unstructured":"Blei, D.M., Lafferty, J.D.: Topic Models, Text Mining, pp. 101\u2013124. 
Chapman and Hall\/CRC (2009). https:\/\/www.cs.columbia.edu\/~blei\/papers\/BleiLafferty2009.pdf","DOI":"10.1201\/9781420059458.ch4"},{"key":"4_CR75","unstructured":"Sheridan, S.: What is topic modelling? A beginner\u2019s guide, Levity Blog (2022). https:\/\/levity.ai\/blog\/what-is-topic-modeling. Accessed 11 Dec 2023"},{"issue":"1","key":"4_CR76","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s40064-016-3252-8","volume":"5","author":"L Liu","year":"2016","unstructured":"Liu, L., Tang, L., Dong, W., Yao, S., Zhou, W.: An overview of topic modeling and its current applications in bioinformatics. Springerplus 5(1), 1\u201322 (2016). https:\/\/doi.org\/10.1186\/s40064-016-3252-8","journal-title":"Springerplus"},{"issue":"2","key":"4_CR77","doi-asserted-by":"publisher","first-page":"945","DOI":"10.1093\/genetics\/155.2.945","volume":"155","author":"JK Pritchard","year":"2000","unstructured":"Pritchard, J.K., Stephens, M., Donnelly, P.: Inference of population structure using multilocus genotype data. Genetics 155(2), 945\u2013959 (2000). https:\/\/doi.org\/10.1093\/genetics\/155.2.945","journal-title":"Genetics"},{"key":"4_CR78","unstructured":"Blei, D.M., Ng, A.Y., Jordan, M.I.: Latent dirichlet allocation. J. Mach. Learn. Res. 3, 993\u20131022 (2003). https:\/\/www.jmlr.org\/papers\/volume3\/blei03a\/blei03a.pdf"},{"key":"4_CR79","doi-asserted-by":"publisher","first-page":"2278","DOI":"10.3390\/su10072278","volume":"10","author":"J Lee","year":"2018","unstructured":"Lee, J., Kang, J., Jun, S., Lim, H., Jang, D., Park, S.: Ensemble modeling for sustainable technology transfer. Sustainability 10, 2278 (2018). https:\/\/doi.org\/10.3390\/su10072278","journal-title":"Sustainability"},{"key":"4_CR80","unstructured":"Zhang, Y., Zhang, Y., Michalski, M., Jiang, Y., Meng, Y., Han, J.: Effective seed-guided topic discovery by integrating multiple types of contexts (2023). arXiv: 2212.06002. 
https:\/\/arxiv.org\/abs\/2212.06002"},{"key":"4_CR81","unstructured":"Smith, N.A., Heilman, M., Hwa, R.: Question generation as a competitive undergraduate course project. In: Proceedings of the NSF Workshop on the Question Generation Shared Task and Evaluation Challenge (2008)"},{"key":"4_CR82","unstructured":"Tatman, R.: Question-Answer Dataset (2017). https:\/\/www.kaggle.com\/datasets\/rtatman\/questionanswer-dataset\/data. Accessed 14 Dec 2023"},{"key":"4_CR83","unstructured":"Roznovjak, J.: Question-Answer Jokes (2017). https:\/\/www.kaggle.com\/datasets\/jiriroz\/qa-jokes. Accessed 14 Dec 2023"},{"key":"4_CR84","doi-asserted-by":"crossref","unstructured":"Rajpurkar, P., Zhang, J., Lopyrev, K., Liang, P.: SQuAD: 100,000+ questions for machine comprehension of text (2016). arXiv: 1606.05250. https:\/\/arxiv.org\/abs\/1606.05250","DOI":"10.18653\/v1\/D16-1264"},{"key":"4_CR85","unstructured":"Zhou, Q., Yang, N., Wei, F., Tan, C., Bao, H., Zhou, M.: Neural question generation from text: a preliminary study (2017). arXiv: 1704.01792. https:\/\/arxiv.org\/abs\/1704.01792"},{"key":"4_CR86","unstructured":"Code for the paper Neural Question Generation from Text: A Preliminary Study. https:\/\/res.qyzhou.me\/redistribute.zip (download link)"},{"key":"4_CR87","unstructured":"Jiang, L., Risdal, M., Dandekar, N., et al.: Quora Question Pairs, Kaggle (2017). https:\/\/kaggle.com\/competitions\/quora-question-pairs. Accessed 15 Dec 2023"},{"key":"4_CR88","doi-asserted-by":"crossref","unstructured":"Ribeiro, M.T., Singh, S., Guestrin, C.: \u201cWhy Should I Trust You?\u201d: Explaining the Predictions of Any Classifier (2016). arXiv: 1602.04938. 
https:\/\/arxiv.org\/abs\/1602.04938","DOI":"10.18653\/v1\/N16-3020"}],"container-title":["Lecture Notes in Computer Science","Big Data Analytics in Astronomy, Science, and Engineering"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-86193-2_4","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,1]],"date-time":"2025-04-01T03:27:50Z","timestamp":1743478070000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-86193-2_4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031861925","9783031861932"],"references-count":88,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-86193-2_4","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"31 March 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"BDA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Big Data Analytics","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Aizu","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Japan","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 November 
2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 November 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"12","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"bigda2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/web-ext.u-aizu.ac.jp\/labs\/is-ds\/BDA2024-Aizu.html","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}