{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,29]],"date-time":"2025-11-29T06:57:05Z","timestamp":1764399425147,"version":"3.46.0"},"reference-count":31,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T00:00:00Z","timestamp":1761091200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T00:00:00Z","timestamp":1761091200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,22]]},"DOI":"10.1109\/apsipaasc65261.2025.11249317","type":"proceedings-article","created":{"date-parts":[[2025,11,28]],"date-time":"2025-11-28T18:40:26Z","timestamp":1764355226000},"page":"700-705","source":"Crossref","is-referenced-by-count":0,"title":["Collective Learning-Based Optimal Transport GAN with Multi-Level Fine-Grained and Global Discriminators for Voice Conversion"],"prefix":"10.1109","author":[{"given":"Sandipan","family":"Dhar","sequence":"first","affiliation":[{"name":"Indian Institute of Technology,Department of Electrical Engineering,Bombay,India"}]},{"given":"Md. Tousin","family":"Akhter","sequence":"additional","affiliation":[{"name":"Indian Institute of Technology,Department of Computer Science and Engineering,Bombay,India"}]},{"given":"Nanda Dulal","family":"Jana","sequence":"additional","affiliation":[{"name":"National Institute of Technology,Department of Computer Science and Engineering,Durgapur,India"}]},{"given":"Swagatam","family":"Das","sequence":"additional","affiliation":[{"name":"Indian Statistical Institute,Electronics and Communication Sciences Unit,Kolkata,India"}]},{"given":"Monorama","family":"Swain","sequence":"additional","affiliation":[{"name":"Institute of Computational Perception, Johannes Kepler University,Linz,Austria"}]},{"given":"Saurav","family":"Chowdhury","sequence":"additional","affiliation":[{"name":"Indian Institute of Technology,Department of Computer Science and Engineering,Jodhpur,India"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/taslp.2020.3038524"},{"key":"ref2","first-page":"2672","article-title":"Generative adversarial nets","volume-title":"NeurIPS 27","author":"Goodfellow","year":"2014"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/tai.2022.3149858"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/icassp49357.2023.10095069"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/apsipaasc58517.2023.10317438"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-48309-7_20"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/tnnls.2023.3335119"},{"key":"ref8","volume":"abs\/2109.13821","author":"Popov","year":"2021","journal-title":"Diffusion-based voice conversion with fast maximum likelihood sampling scheme"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.3390\/app14209595"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/icais53314.2022.9743083"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/iccci51764.2021.9486805"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/indicon59947.2023.10440809"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-517"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2025.3530171"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.3390\/app9071324"},{"volume-title":"Robust speech recognition via large-scale weak supervision","year":"2022","author":"Radford","key":"ref16"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr46437.2021.00383"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00888"},{"key":"ref19","volume":"abs\/2206.11114","author":"Zhang","year":"2022","journal-title":"Evolutionary game-theoretical analysis for general multiplayer asymmetric games"},{"key":"ref20","article-title":"The cmu arctic speech databases","volume-title":"Proc. Speech Synthesis Workshop","author":"Kominek","year":"2004"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9414851"},{"key":"ref22","first-page":"19594","article-title":"Styletts 2: Towards human-level text-tospeech through style diffusion and adversarial training with large speech language models","volume-title":"NeurIPS","volume":"36","author":"Li","year":"2023"},{"key":"ref23","volume":"abs\/1803.05573","author":"Salimans","year":"2018","journal-title":"Improving gans using optimal transport"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.3390\/sym13071147"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.23919\/apsipaasc55919.2022.9980151"},{"key":"ref26","article-title":"Adam: A method for stochastic optimization","volume":"abs\/1412.6980","author":"Kingma","year":"2014","journal-title":"CoRR"},{"key":"ref27","volume":"abs\/2010.05646","author":"Kong","year":"2020","journal-title":"Hifi-gan: Generative adversarial networks for efficient and high fidelity speech synthesis"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/lsp.2019.2961213"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/slt48900.2021.9383498"},{"key":"ref30","volume":"abs\/2504.19197","author":"Dhar","year":"2025","journal-title":"Generative adversarial network based voice conversion: Techniques, challenges, and recent advancements"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10097255"}],"event":{"name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","start":{"date-parts":[[2025,10,22]]},"location":"Singapore, Singapore","end":{"date-parts":[[2025,10,24]]}},"container-title":["2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11248853\/11248968\/11249317.pdf?arnumber=11249317","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,29]],"date-time":"2025-11-29T06:54:47Z","timestamp":1764399287000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11249317\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,22]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/apsipaasc65261.2025.11249317","relation":{},"subject":[],"published":{"date-parts":[[2025,10,22]]}}}