{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,31]],"date-time":"2026-03-31T14:25:33Z","timestamp":1774967133160,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":13,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,12,6]],"date-time":"2023-12-06T00:00:00Z","timestamp":1701820800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/"}],"funder":[{"name":"National Science and Technology Development Agency, Thailand"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,12,6]]},"DOI":"10.1145\/3628454.3631582","type":"proceedings-article","created":{"date-parts":[[2023,11,28]],"date-time":"2023-11-28T19:43:41Z","timestamp":1701200621000},"page":"1-5","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":2,"title":["Alaryngeal Speech Generation Using MaskCycleGAN-VC and Timbre-Enhanced Loss"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-0746-8266","authenticated-orcid":false,"given":"Hnin Yadana","family":"Lwin","sequence":"first","affiliation":[{"name":"King Mongkut's University of Technology Thonburi, Thailand"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2957-6084","authenticated-orcid":false,"given":"Wuttipong","family":"Kumwilaisak","sequence":"additional","affiliation":[{"name":"King Mongkut's University of Technology Thonburi, Thailand"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4064-4882","authenticated-orcid":false,"given":"Chatchawarn","family":"Hansakunbuntheung","sequence":"additional","affiliation":[{"name":"National Science and Technology Development Agency, Thailand"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8240-2772","authenticated-orcid":false,"given":"Nattanun","family":"Thatphithakkul","sequence":"additional","affiliation":[{"name":"National Science and Technology Development Agency, Thailand"}]}],"member":"320","published-online":{"date-parts":[[2023,12,6]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Proceedings of the 33rd International Conference on International Conference on Machine Learning -","volume":"48","author":"Amodei Dario","year":"2016","unstructured":"Dario Amodei 2016. Deep Speech 2: End-to-end speech recognition in English and Mandarin. In Proceedings of the 33rd International Conference on International Conference on Machine Learning - Volume 48 (New York, NY, USA) (ICML\u201916). 173\u2013182."},{"key":"e_1_3_2_1_2_1","volume-title":"Aidan adn Elsen\u00a0Erich Dieleman","author":"Bi\u0144kowski Miko\u0142aj","year":"2020","unstructured":"Miko\u0142aj Bi\u0144kowski, Jeff Donahue, Aidan adn Elsen\u00a0Erich Dieleman, Sander adn\u00a0Clark, Norman Casagrande, Luis\u00a0C. Cobo, and Karen Simonyan. 2020. High Fidelity Speech Synthesis with Adversarial Networks. (2020). https:\/\/openreview.net\/forum?id=r1gfQgSFDr"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-10868"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2019.8682897"},{"key":"e_1_3_2_1_5_1","volume-title":"Interspeech","author":"Kaneko Takuhiro","year":"2020","unstructured":"Takuhiro Kaneko, Hirokazu Kameoka, Kou Tanaka, and Nobukatsu Hojo. 2020. Cyclegan-VC3: Examining and improving Cyclegan-VCs for Mel-Spectrogram Conversion. In Interspeech 2020."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9414851"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"crossref","unstructured":"Kevin Kilgour Mauricio Zuluaga Dominik Roblek and Matthew Sharifi. 2019. Fr\u00e9chet audio distance: A reference-free metric for evaluating music enhancement algorithms. In INTERSPEECH.","DOI":"10.21437\/Interspeech.2019-2219"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/PACRIM.1993.407206"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46487-9_43"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.304"},{"key":"e_1_3_2_1_11_1","volume-title":"Specaugment: A simple data augmentation method for automatic speech recognition. arXiv preprint arXiv:1904.08779","author":"Park S.","year":"2019","unstructured":"Daniel\u00a0S. Park, William Chan, Yu Zhang, Chung-Cheng Chiu, Barret Zoph, Ekin\u00a0D. Cubuk, and Quoc\u00a0V. Le. 2019. Specaugment: A simple data augmentation method for automatic speech recognition. arXiv preprint arXiv:1904.08779 (2019)."},{"key":"e_1_3_2_1_12_1","volume-title":"Accessed","author":"AI.","year":"2021","unstructured":"Resemble-AI. 2021. Resemblyzer: A Python package to analyze and compare voices with deep learning. https:\/\/github.com\/resemble-ai\/Resemblyzer. Accessed: Aug. 24, 2023."},{"key":"e_1_3_2_1_13_1","first-page":"115","article-title":"Perceptual evaluation of alaryngeal speech","volume":"36","author":"Rosso Marinela","year":"2012","unstructured":"Marinela Rosso, Ljiljana Siri\u0107, Robert Ti\u0107ac, Radan Starcevi\u0107, Igor Segec, and Nikola Kraljik. 2012. Perceptual evaluation of alaryngeal speech. Collegium Antropologicum 36, Suppl 2 (2012), 115\u2013118.","journal-title":"Collegium Antropologicum"}],"event":{"name":"IAIT 2023: 13th International Conference on Advances in Information Technology","location":"Bangkok Thailand","acronym":"IAIT 2023"},"container-title":["Proceedings of the 13th International Conference on Advances in Information Technology"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3628454.3631582","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3628454.3631582","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T23:46:39Z","timestamp":1755906399000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3628454.3631582"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,12,6]]},"references-count":13,"alternative-id":["10.1145\/3628454.3631582","10.1145\/3628454"],"URL":"https:\/\/doi.org\/10.1145\/3628454.3631582","relation":{},"subject":[],"published":{"date-parts":[[2023,12,6]]},"assertion":[{"value":"2023-12-06","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}