{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,15]],"date-time":"2025-11-15T07:32:53Z","timestamp":1763191973588,"version":"3.45.0"},"reference-count":34,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,6,30]],"date-time":"2025-06-30T00:00:00Z","timestamp":1751241600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,6,30]],"date-time":"2025-06-30T00:00:00Z","timestamp":1751241600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,6,30]]},"DOI":"10.1109\/ijcnn64981.2025.11228946","type":"proceedings-article","created":{"date-parts":[[2025,11,14]],"date-time":"2025-11-14T18:46:15Z","timestamp":1763145975000},"page":"1-10","source":"Crossref","is-referenced-by-count":0,"title":["S2N: A Synthetic Data-Driven Approach for Speaker-To-Dialogue Attribution in Novels"],"prefix":"10.1109","author":[{"given":"Yiqian","family":"Huang","sequence":"first","affiliation":[{"name":"Institute of Science Tokyo,Tokyo,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ying","family":"Zhang","sequence":"additional","affiliation":[{"name":"RIKEN Center for Advanced Intelligence Project,Sendai,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kotaro","family":"Funakoshi","sequence":"additional","affiliation":[{"name":"Institute of Science Tokyo,Tokyo,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Manabu","family":"Okumura","sequence":"additional","affiliation":[{"name":"Institute of Science Tokyo,Tokyo,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yang","family":"Cao","sequence":"additional","affiliation":[{"name":"Institute of Science Tokyo,Tokyo,Japan"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","first-page":"5820","article-title":"What does the sea say to the shore? a BERT based DST style approach for speaker to dialogue attribution in novels","volume-title":"Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","author":"Cuesta-Lazaro"},{"key":"ref2","first-page":"2274","article-title":"End-to-end Chinese speaker identification","volume-title":"Proceedings of the 2022 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies","author":"Yu"},{"key":"ref3","first-page":"460","article-title":"A two-stage sieve approach for quote attribution","volume-title":"Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics: Volume 1, Long Papers","author":"Muzny"},{"key":"ref4","first-page":"1312","article-title":"Identification of speakers in novels","volume-title":"Proceedings of the 51st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","author":"He"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-609"},{"key":"ref6","first-page":"3455","article-title":"Symbolization, prompt, and classification: A framework for implicit speaker identification in novels","volume-title":"Findings of the Association for Computational Linguistics: EMNLP 2023","author":"Chen"},{"article-title":"The curse of recursion: Training on generated data makes models forget","year":"2024","author":"Shumailov","key":"ref7"},{"key":"ref8","doi-asserted-by":"crossref","DOI":"10.18653\/v1\/2024.findings-emnlp.873","article-title":"Unveiling the flaws: Exploring imperfections in synthetic data and mitigation strategies for large language models","author":"Chen","year":"2024"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-024-07566-y"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i18.29955"},{"key":"ref11","article-title":"Large language model as attributed training data generator: A tale of diversity and bias","volume":"36","author":"Yu","year":"2024","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-naacl.228"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-emnlp.873"},{"key":"ref14","first-page":"4171","article-title":"BERT: Pre-training of deep bidirectional transformers for language understanding","volume-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers)","author":"Devlin"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.2139\/ssrn.5250633"},{"key":"ref16","first-page":"634","article-title":"Benchmarking robustness of machine reading comprehension models","volume-title":"Findings of the Association for Computational Linguistics: ACL-IJCNLP 2021","author":"Si"},{"key":"ref17","first-page":"2470","article-title":"Evaluating neural model robustness for machine comprehension","volume-title":"Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: Main Volume","author":"Wu"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i05.6357"},{"key":"ref19","first-page":"18 661","article-title":"Supervised contrastive learning","volume":"33","author":"Khosla","year":"2020","journal-title":"Advances in neural information processing systems"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.552"},{"key":"ref21","first-page":"3898","article-title":"ESimCSE: Enhanced sample building method for contrastive learning of unsupervised sentence embedding","volume-title":"Proceedings of the 29th International Conference on Computational Linguistics","author":"Wu"},{"key":"ref22","first-page":"9929","article-title":"Understanding contrastive representation learning through alignment and uniformity on the hypersphere","volume-title":"International conference on machine learning","author":"Wang"},{"article-title":"Early stopping against label noise without validation data","volume-title":"The Twelfth International Conference on Learning Representations","author":"Yuan","key":"ref23"},{"key":"ref24","first-page":"24 392","article-title":"Understanding and improving early stopping for learning with noisy labels","volume":"34","author":"Bai","year":"2021","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref25","first-page":"1885","article-title":"Understanding black-box predictions via influence functions","volume-title":"International conference on machine learning","author":"Koh"},{"key":"ref26","first-page":"19 920","article-title":"Estimating training data influence by tracing gradient descent","volume":"33","author":"Pruthi","year":"2020","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i17.29870"},{"journal-title":"Cped: A large-scale chinese personalized and emotional dialogue dataset for conversational ai","year":"2022","author":"Chen","key":"ref28"},{"key":"ref29","first-page":"610","article-title":"MPDD: A multiparty dialogue dataset for analysis of emotions and interpersonal relationships","volume-title":"Proceedings of the Twelfth Language Resources and Evaluation Conference","author":"Chen"},{"key":"ref30","first-page":"2337","article-title":"The CRECIL corpus: a new dataset for extraction of relations between characters in Chinese multi-party dialogues","volume-title":"Proceedings of the Thirteenth Language Resources and Evaluation Conference","author":"Jiang"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/APSIPAASC47483.2019.9023129"},{"key":"ref32","first-page":"2383","article-title":"SQuAD: 100, 000+ questions for machine comprehension of text","volume-title":"Proceedings of the 2016 Conference on Empirical Methods in Natural Language Processing","author":"Rajpurkar"},{"key":"ref33","first-page":"4762","article-title":"CLUE: A Chinese language understanding evaluation benchmark","volume-title":"Proceedings of the 28th International Conference on Computational Linguistics","author":"Xu"},{"key":"ref34","first-page":"657","article-title":"Revisiting pre-trained models for Chinese natural language processing","volume-title":"Findings of the Association for Computational Linguistics: EMNLP 2020","author":"Cui"}],"event":{"name":"2025 International Joint Conference on Neural Networks (IJCNN)","start":{"date-parts":[[2025,6,30]]},"location":"Rome, Italy","end":{"date-parts":[[2025,7,5]]}},"container-title":["2025 International Joint Conference on Neural Networks (IJCNN)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11227166\/11227148\/11228946.pdf?arnumber=11228946","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,15]],"date-time":"2025-11-15T07:28:51Z","timestamp":1763191731000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11228946\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,30]]},"references-count":34,"URL":"https:\/\/doi.org\/10.1109\/ijcnn64981.2025.11228946","relation":{},"subject":[],"published":{"date-parts":[[2025,6,30]]}}}