{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T15:29:38Z","timestamp":1759332578413,"version":"3.40.3"},"publisher-location":"Cham","reference-count":29,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031578694"},{"type":"electronic","value":"9783031578700"}],"license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024]]},"DOI":"10.1007\/978-3-031-57870-0_10","type":"book-chapter","created":{"date-parts":[[2024,4,9]],"date-time":"2024-04-09T04:01:52Z","timestamp":1712635312000},"page":"108-122","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Topic Analysis of Japanese Sentences Using Sentence Embeddings"],"prefix":"10.1007","author":[{"given":"Kenshin","family":"Tsumuraya","sequence":"first","affiliation":[]},{"given":"Huang","family":"Yonghui","sequence":"additional","affiliation":[]},{"given":"Minoru","family":"Uehara","sequence":"additional","affiliation":[]},{"given":"Yoshihiro","family":"Adachi","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,4,10]]},"reference":[{"key":"10_CR1","first-page":"993","volume":"3","author":"DM Blei","year":"2003","unstructured":"Blei, D.M., Ng, A.Y., Jordan, M.I.: Latent Dirichlet allocation. J. Mach. Learn. Res. 3, 993\u20131022 (2003)","journal-title":"J. Mach. Learn. Res."},{"key":"10_CR2","unstructured":"Rosen-Zvi, M., Griffiths, T., Steyvers, M., Smyth, P.: The author-topic model for authors and documents. In: Proceedings of the Twentieth Conference on Uncertainty in Artificial Intelligence (UAI2004), pp. 487\u2013494 (2004)"},{"key":"10_CR3","doi-asserted-by":"publisher","unstructured":"Zhao, W.X., Jiang, J., Weng, J., He, J., Lim, E.P.: Comparing Twitter and traditional media using topic models, In: Clough, P., et al. (eds.) Advances in Information Retrieval. ECIR 2011. LNCS, vol. 6611, pp. 338\u2013349. Springer, Cham (2011). https:\/\/doi.org\/10.1007\/978-3-642-20161-5_34","DOI":"10.1007\/978-3-642-20161-5_34"},{"key":"10_CR4","unstructured":"SMU Text Mining Group: Twitter-LDA. https:\/\/github.com\/minghui\/Twitter-LDA. Accessed 8 Jan 2023"},{"key":"10_CR5","unstructured":"Lee, D.D., Seung, H.S.: Algorithms for non-negative matrix factorization. In: Advances in Neural Information Processing Systems 13: Proceedings of the 2000 Conference, pp. 556\u2013562. MIT Press (2001)"},{"key":"10_CR6","doi-asserted-by":"crossref","unstructured":"Sia, S., Dalmia, A., Mielke, S.J.: Tired of topic models? Clusters of pretrained word embeddings make for fast and good topics too! In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing, pp. 1728\u20131736 (2020)","DOI":"10.18653\/v1\/2020.emnlp-main.135"},{"key":"10_CR7","unstructured":"Mikolov, T., Chen, K., Corrado, G., Dean, J.: Efficient estimation of word representations in vector space. arXiv:1301.3781 (2013)"},{"key":"10_CR8","unstructured":"Devlin, J., Chang, M.W., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding. arXiv:1810.04805 (2018)"},{"key":"10_CR9","unstructured":"Grootendorst, M.: BERTopic: Neural topic modeling with a class-based TF-IDF procedure. arXiv:2203.05794 (2022)"},{"key":"10_CR10","doi-asserted-by":"crossref","unstructured":"Reimers, N., Gurevych, I.: Sentence-BERT: sentence embeddings using Siamese BERT-Networks. In: Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing. Association for Computational Linguistics, (Online) (2019). https:\/\/arxiv.org\/abs\/1908.10084","DOI":"10.18653\/v1\/D19-1410"},{"key":"10_CR11","doi-asserted-by":"crossref","unstructured":"Tsumuraya, K., Amano, M., Uehara, M., Adachi, Y.: Topic-based clustering of Japanese sentences using sentence-BERT. In: CANDARW 2022 (2022)","DOI":"10.1109\/CANDARW57323.2022.00044"},{"key":"10_CR12","doi-asserted-by":"publisher","unstructured":"Amano, M., Tsumuraya, K., Uehara, M., Adachi, Y.: An analysis of representative works of Japanese literature based on emotions and topics. In: Barolli, L. (eds.) Advanced Information Networking and Applications. AINA 2023. LNNS, vol. 654, pp. 99\u2013112. Springer, Cham (2023). https:\/\/doi.org\/10.1007\/978-3-031-28451-9_9","DOI":"10.1007\/978-3-031-28451-9_9"},{"key":"10_CR13","doi-asserted-by":"crossref","unstructured":"R\u00f6der, M., Both, A., Hinneburg, A.: Exploring the space of topic coherence measures. In: WSDM 2015: Proceedings of the Eighth ACM International Conference on Web Search and Data Mining, pp. 399\u2013408 (2015)","DOI":"10.1145\/2684822.2685324"},{"key":"10_CR14","doi-asserted-by":"crossref","unstructured":"Terragni, S., Fersini, E., Galuzzi, B.G., Tropeano, P., Candelieri, A.: OCTIS: comparing and optimizing topic models is simple! In: Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: System Demonstrations, pp. 263\u2013270 (2021)","DOI":"10.18653\/v1\/2021.eacl-demos.31"},{"key":"10_CR15","unstructured":"Chuang, J., Gupta, S., Manning, C.D., Heer, J.: Topic model diagnostics: assessing domain relevance via topical alignment. In: Proceedings of the 30th International Conference on Machine Learning, JMLR: W&CP, vol. 28 (2013)"},{"key":"10_CR16","doi-asserted-by":"crossref","unstructured":"Koren\u010di\u0107, D., Ristov, S., Repar, J., \u0160najder, J.: A topic coverage approach to evaluation of topic models. arXiv:2012.06274 (2021)","DOI":"10.1109\/ACCESS.2021.3109425"},{"key":"10_CR17","unstructured":"National Institute of Information and Communications Technology: NICT BERT Japanese Pre-trained models. https:\/\/alaginrc.nict.go.jp\/nict-bert\/index.html. Accessed 29 Oct 2022"},{"key":"10_CR18","unstructured":"Yoshikoshi, T., Kawahara, D., Kurohashi, S.: Multilingualization of a natural language inference dataset using machine translation, SIG Technical reports, vol. 2020-NL-244, no. 6 (2020). (in Japanese)"},{"key":"10_CR19","unstructured":"Arthur, D., Vassilvitskii, S.: K-means++: The Advantages of Careful Seeding. https:\/\/theory.stanford.edu\/~sergei\/papers\/kMeansPP-soda.pdf. Accessed 16 Aug 2023"},{"key":"10_CR20","first-page":"2825","volume":"12","author":"F Pedregosa","year":"2011","unstructured":"Pedregosa, F., et al.: Scikit-learn: machine learning in Python. J. Mach. Learn. Res. 12, 2825\u20132830 (2011)","journal-title":"J. Mach. Learn. Res."},{"key":"10_CR21","first-page":"2837","volume":"11","author":"NX Vinh","year":"2010","unstructured":"Vinh, N.X., Epps, J., Bailey, J.: Information theoretic measures for clusterings comparison: variants, properties, normalization and correction for chance. J. Mach. Learn. Res. 11, 2837\u20132854 (2010)","journal-title":"J. Mach. Learn. Res."},{"key":"10_CR22","unstructured":"Mikolov, T., Chen, K., Corrado, G.S., Dean, J.: Efficient estimation of word representations in vector space. In: International Conference on Learning Representations, Workshop Track Proceedings (2013)"},{"key":"10_CR23","unstructured":"\u0158eh\u016f\u0159ek, R., Sojka, P.: Software framework for topic modelling with large corpora. In: Proceedings of the LREC 2010 Workshop on New Challenges for NLP (2010)"},{"key":"10_CR24","unstructured":"\u0158eh\u016f\u0159ek, R.: GENSIM: Topic modelling for humans. https:\/\/radimrehurek.com\/gensim\/index.html. Accessed 28 Aug 2023"},{"key":"10_CR25","doi-asserted-by":"crossref","unstructured":"Tsumuraya, K., Uehara, M., Adachi, Y.: Semantic search of Japanese sentences using distributed representations. In: The 8th International Workshop on GPU Computing and AI (2023)","DOI":"10.1109\/CANDARW60564.2023.00021"},{"key":"10_CR26","unstructured":"Akama, R., Isobe, J., Suzuki, J., Inui, K.: Construction of a Japanese Daily dialogue corpus [nihongo nichijyou taiwa corpus no kouchiku]. In: Proceedings of the 29th Annual Meeting of the Association for Natural Language Processing, pp. 108\u2013113 (2023). (in Japanese)"},{"key":"10_CR27","unstructured":"RONDHUIT: Livedoor News Corpus. https:\/\/www.rondhuit.com\/download.html. Accessed 5 Sept 2023"},{"key":"10_CR28","unstructured":"The SciPy community: SciPy. https:\/\/scipy.org\/. Accessed 8 Sept 2023"},{"key":"10_CR29","doi-asserted-by":"crossref","unstructured":"Tsumuraya, K., Uehara, M., Adachi, Y.: Performance Improvement of Semantic Search Using Sentence Embeddings by Dimensionality Reduction, AINA2024 (submitted)","DOI":"10.1007\/978-3-031-57870-0_11"}],"container-title":["Lecture Notes on Data Engineering and Communications Technologies","Advanced Information Networking and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-57870-0_10","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,15]],"date-time":"2024-11-15T22:45:36Z","timestamp":1731710736000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-57870-0_10"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"ISBN":["9783031578694","9783031578700"],"references-count":29,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-57870-0_10","relation":{},"ISSN":["2367-4512","2367-4520"],"issn-type":[{"type":"print","value":"2367-4512"},{"type":"electronic","value":"2367-4520"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"10 April 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"AINA","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Advanced Information Networking and Applications","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Kitakyushu","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Japan","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17 April 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"19 April 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"38","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"aina2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/voyager.ce.fit.ac.jp\/conf\/aina\/2024\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}