{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,28]],"date-time":"2026-01-28T20:25:37Z","timestamp":1769631937258,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":31,"publisher":"ACM","funder":[{"name":"UKRI AI World Leading Re- searcher Fellowship","award":["EP\/W002949\/1"],"award-info":[{"award-number":["EP\/W002949\/1"]}]},{"name":"JPMC Faculty Research Award","award":[""],"award-info":[{"award-number":[""]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,11,15]]},"DOI":"10.1145\/3768292.3770442","type":"proceedings-article","created":{"date-parts":[[2025,11,14]],"date-time":"2025-11-14T07:24:26Z","timestamp":1763105066000},"page":"211-219","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["Discrete Flow Matching is a Surprisingly Effective Post-training Method to Address Compound Error in Autoregressive Models"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0007-7847-9292","authenticated-orcid":false,"given":"Kang","family":"Li","sequence":"first","affiliation":[{"name":"Department of Statistics, University of Oxford, Oxford, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0584-3504","authenticated-orcid":false,"given":"Bidipta","family":"Sarkar","sequence":"additional","affiliation":[{"name":"Foerster Lab for AI Research, University of Oxford, Oxford, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5707-5415","authenticated-orcid":false,"given":"Zheng","family":"Xiong","sequence":"additional","affiliation":[{"name":"Department of Computer Science, University of Oxford, Oxford, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-6265-9607","authenticated-orcid":false,"given":"Sascha","family":"Frey","sequence":"additional","affiliation":[{"name":"Department of Computer Science, University of Oxford, Oxford, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-6062-3015","authenticated-orcid":false,"given":"Zilin","family":"Wang","sequence":"additional","affiliation":[{"name":"Foerster Lab for AI Research, University of Oxford, Oxford, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-1947-6154","authenticated-orcid":false,"given":"Frensi","family":"Zejnullahu","sequence":"additional","affiliation":[{"name":"Department of Statistics, University of Oxford, Oxford, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-2218-1734","authenticated-orcid":false,"given":"Alfred","family":"Backhouse","sequence":"additional","affiliation":[{"name":"Department of Computer Science, University of Oxford, Oxford, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3392-0394","authenticated-orcid":false,"given":"Stefan","family":"Zohren","sequence":"additional","affiliation":[{"name":"Department of Engineering Science, University of Oxford, Oxford, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2082-734X","authenticated-orcid":false,"given":"Anisoara","family":"Calinescu","sequence":"additional","affiliation":[{"name":"Department of Computer Science, University of Oxford, Oxford, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8464-2152","authenticated-orcid":false,"given":"Mihai","family":"Cucuringu","sequence":"additional","affiliation":[{"name":"Department of Mathematics, University of California Los Angeles, Los Angeles, USA and Department of Statistics &amp; Oxford Man Institute of Quantitative Finance, Oxford, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9688-2498","authenticated-orcid":false,"given":"Jakob","family":"Foerster","sequence":"additional","affiliation":[{"name":"Foerster Lab for AI Research, University of Oxford, Oxford, United Kingdom"}]}],"member":"320","published-online":{"date-parts":[[2025,11,14]]},"reference":[{"key":"e_1_3_3_1_2_2","volume-title":"Advances in Neural Information Processing Systems","author":"Austin Jacob","year":"2021","unstructured":"Jacob Austin, Daniel\u00a0D. Johnson, Jonathan Ho, Daniel Tarlow, and Rianne van\u00a0den Berg. 2021. Structured Denoising Diffusion Models in Discrete State-Spaces. In Advances in Neural Information Processing Systems, A.\u00a0Beygelzimer, Y.\u00a0Dauphin, P.\u00a0Liang, and J.\u00a0Wortman Vaughan (Eds.). https:\/\/openreview.net\/forum?id=h7-XixPCAL"},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"publisher","DOI":"10.5555\/2969239.2969370"},{"key":"e_1_3_3_1_4_2","first-page":"1877","volume-title":"Advances in Neural Information Processing Systems","author":"Brown Tom","year":"2020","unstructured":"Tom Brown, Benjamin Mann, Nick Ryder, Melanie Subbiah, Jared\u00a0D Kaplan, Prafulla Dhariwal, Arvind Neelakantan, Pranav Shyam, Girish Sastry, Amanda Askell, Sandhini Agarwal, Ariel Herbert-Voss, Gretchen Krueger, Tom Henighan, Rewon Child, Aditya Ramesh, Daniel Ziegler, Jeffrey Wu, Clemens Winter, Chris Hesse, Mark Chen, Eric Sigler, Mateusz Litwin, Scott Gray, Benjamin Chess, Jack Clark, Christopher Berner, Sam McCandlish, Alec Radford, Ilya Sutskever, and Dario Amodei. 2020. Language Models are Few-Shot Learners. In Advances in Neural Information Processing Systems , H.\u00a0Larochelle, M.\u00a0Ranzato, R.\u00a0Hadsell, M.F. Balcan, and H.\u00a0Lin (Eds.), Vol.\u00a033. Curran Associates, Inc., 1877\u20131901. https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2020\/file\/1457c0d6bfcb4967418bfb8ac142f64a-Paper.pdf"},{"key":"e_1_3_3_1_5_2","series-title":"(ICML\u201924)","volume-title":"Proceedings of the 41st International Conference on Machine Learning","author":"Campbell Andrew","year":"2024","unstructured":"Andrew Campbell, Jason Yim, Regina Barzilay, Tom Rainforth, and Tommi Jaakkola. 2024. Generative flows on discrete state-spaces: enabling multimodal flows with applications to protein co-design. In Proceedings of the 41st International Conference on Machine Learning (Vienna, Austria) (ICML\u201924). JMLR.org, Article 213, 60\u00a0pages."},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01103"},{"key":"e_1_3_3_1_7_2","volume-title":"International Conference on Learning Representations","author":"Che Tong","year":"2017","unstructured":"Tong Che, Yanran Li, Athul Jacob, Yoshua Bengio, and Wenjie Li. 2017. Mode Regularized Generative Adversarial Networks. In International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=HJKkY35le"},{"key":"e_1_3_3_1_8_2","unstructured":"Xiaokang Chen Zhiyu Wu Xingchao Liu Zizheng Pan Wen Liu Zhenda Xie Xingkai Yu and Chong Ruan. 2025. Janus-Pro: Unified Multimodal Understanding and Generation with Data and Model Scaling. arxiv:https:\/\/arXiv.org\/abs\/2501.17811\u00a0[cs.AI] https:\/\/arxiv.org\/abs\/2501.17811"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1633"},{"key":"e_1_3_3_1_10_2","unstructured":"Ian\u00a0J. Goodfellow Jean Pouget-Abadie Mehdi Mirza Bing Xu David Warde-Farley Sherjil Ozair Aaron Courville and Yoshua Bengio. 2014. Generative Adversarial Networks. arxiv:https:\/\/arXiv.org\/abs\/1406.2661\u00a0[stat.ML] https:\/\/arxiv.org\/abs\/1406.2661"},{"key":"e_1_3_3_1_11_2","first-page":"135011","volume-title":"Advances in Neural Information Processing Systems","volume":"37","author":"Kapu\u015bniak Kacper","year":"2024","unstructured":"Kacper Kapu\u015bniak, Peter Potaptchik, Teodora Reu, Leo Zhang, Alexander Tong, Michael Bronstein, Avishek\u00a0Joey Bose, and Francesco Di\u00a0Giovanni. 2024. Metric Flow Matching for Smooth Interpolations on the Data Manifold. In Advances in Neural Information Processing Systems , A.\u00a0Globerson, L.\u00a0Mackey, D.\u00a0Belgrave, A.\u00a0Fan, U.\u00a0Paquet, J.\u00a0Tomczak, and C.\u00a0Zhang (Eds.), Vol.\u00a037. Curran Associates, Inc., 135011\u2013135042. https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2024\/file\/f381114cf5aba4e45552869863deaaa7-Paper-Conference.pdf"},{"key":"e_1_3_3_1_12_2","volume-title":"Advances in Neural Information Processing Systems","author":"Lamb Alex\u00a0M","year":"2016","unstructured":"Alex\u00a0M Lamb, Anirudh\u00a0Goyal ALIAS PARTH\u00a0GOYAL, Ying Zhang, Saizheng Zhang, Aaron\u00a0C Courville, and Yoshua Bengio. 2016. Professor Forcing: A New Algorithm for Training Recurrent Networks. In Advances in Neural Information Processing Systems , D.\u00a0Lee, M.\u00a0Sugiyama, U.\u00a0Luxburg, I.\u00a0Guyon, and R.\u00a0Garnett (Eds.), Vol.\u00a029. Curran Associates, Inc.https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2016\/file\/16026d60ff9b54410b3435b403afd226-Paper.pdf"},{"key":"e_1_3_3_1_13_2","unstructured":"Yuchen Li Alexandre Kirchmeyer Aashay Mehta Yilong Qin Boris Dadachev Kishore Papineni Sanjiv Kumar and Andrej Risteski. 2024. Promises and Pitfalls of Generative Masked Language Modeling: Theoretical Framework and Practical Guidelines. arxiv:https:\/\/arXiv.org\/abs\/2407.21046\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/2407.21046"},{"key":"e_1_3_3_1_14_2","unstructured":"Yaron Lipman et\u00a0al. 2023. Flow matching for generative modeling. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2210.02747 (2023)."},{"key":"e_1_3_3_1_15_2","volume-title":"The Eleventh International Conference on Learning Representations","author":"Lipman Yaron","year":"2023","unstructured":"Yaron Lipman, Ricky T.\u00a0Q. Chen, Heli Ben-Hamu, Maximilian Nickel, and Matthew Le. 2023. Flow Matching for Generative Modeling. In The Eleventh International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=PqvMRDCJT9t"},{"key":"e_1_3_3_1_16_2","unstructured":"Yiyang Ma Xingchao Liu Xiaokang Chen Wen Liu Chengyue Wu Zhiyu Wu Zizheng Pan Zhenda Xie Haowei Zhang Xingkai yu Liang Zhao Yisong Wang Jiaying Liu and Chong Ruan. 2025. JanusFlow: Harmonizing Autoregression and Rectified Flow for Unified Multimodal Understanding and Generation. arxiv:https:\/\/arXiv.org\/abs\/2411.07975\u00a0[cs.CV] https:\/\/arxiv.org\/abs\/2411.07975"},{"key":"e_1_3_3_1_17_2","unstructured":"Peer Nagy Sascha Frey Kang Li Bidipta Sarkar Svitlana Vyetrenko Stefan Zohren Ani Calinescu and Jakob Foerster. 2025. LOB-Bench: Benchmarking Generative AI for Finance \u2013 an Application to Limit Order Book Data. arxiv:https:\/\/arXiv.org\/abs\/2502.09172\u00a0[cs.LG] https:\/\/arxiv.org\/abs\/2502.09172"},{"key":"e_1_3_3_1_18_2","doi-asserted-by":"crossref","unstructured":"Peer Nagy Sascha Frey Silvia Sapora Kang Li Anisoara Calinescu Stefan Zohren and Jakob Foerster. 2023. Generative AI for End-to-End Limit Order Book Modelling: A Token-Level Autoregressive Generative Model of Message Flow Using a Deep State Space Network. arxiv:https:\/\/arXiv.org\/abs\/2309.00638\u00a0[q-fin.TR] https:\/\/arxiv.org\/abs\/2309.00638","DOI":"10.1145\/3604237.3626898"},{"key":"e_1_3_3_1_19_2","unstructured":"Shen Nie Fengqi Zhu Zebin You Xiaolu Zhang Jingyang Ou Jun Hu Jun Zhou Yankai Lin Ji-Rong Wen and Chongxuan Li. 2025. Large Language Diffusion Models. arxiv:https:\/\/arXiv.org\/abs\/2502.09992\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/2502.09992"},{"key":"e_1_3_3_1_20_2","series-title":"Proceedings of Machine Learning Research","first-page":"8821","volume-title":"Proceedings of the 38th International Conference on Machine Learning","volume":"139","author":"Ramesh Aditya","year":"2021","unstructured":"Aditya Ramesh, Mikhail Pavlov, Gabriel Goh, Scott Gray, Chelsea Voss, Alec Radford, Mark Chen, and Ilya Sutskever. 2021. Zero-Shot Text-to-Image Generation. In Proceedings of the 38th International Conference on Machine Learning(Proceedings of Machine Learning Research, Vol.\u00a0139), Marina Meila and Tong Zhang (Eds.). PMLR, 8821\u20138831. https:\/\/proceedings.mlr.press\/v139\/ramesh21a.html"},{"key":"e_1_3_3_1_21_2","unstructured":"Marc\u2019Aurelio Ranzato Sumit Chopra Michael Auli and Wojciech Zaremba. 2016. Sequence Level Training with Recurrent Neural Networks. arxiv:https:\/\/arXiv.org\/abs\/1511.06732\u00a0[cs.LG] https:\/\/arxiv.org\/abs\/1511.06732"},{"key":"e_1_3_3_1_22_2","unstructured":"Subham Sahoo et\u00a0al. 2024. Simple and effective masked diffusion language models. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2406.07524 (2024)."},{"key":"e_1_3_3_1_23_2","unstructured":"Subham\u00a0Sekhar Sahoo Justin Deschenaux Aaron Gokaslan Guanghan Wang Justin Chiu and Volodymyr Kuleshov. 2025. The Diffusion Duality. arxiv:https:\/\/arXiv.org\/abs\/2506.10892\u00a0[cs.LG] https:\/\/arxiv.org\/abs\/2506.10892"},{"key":"e_1_3_3_1_24_2","volume-title":"The Thirteenth International Conference on Learning Representations","author":"Shaul Neta","year":"2025","unstructured":"Neta Shaul, Itai Gat, Marton Havasi, Daniel Severo, Anuroop Sriram, Peter Holderrieth, Brian Karrer, Yaron Lipman, and Ricky T.\u00a0Q. Chen. 2025. Flow Matching with General Discrete Paths: A Kinetic-Optimal Perspective. In The Thirteenth International Conference on Learning Representations. https:\/\/openreview.net\/forum?id=tcvMzR2NrP"},{"key":"e_1_3_3_1_25_2","unstructured":"Akash Srivastava Lazar Valkov Chris Russell Michael\u00a0U. Gutmann and Charles Sutton. 2017. VEEGAN: Reducing Mode Collapse in GANs using Implicit Variational Learning. arxiv:https:\/\/arXiv.org\/abs\/1705.07761\u00a0[stat.ML] https:\/\/arxiv.org\/abs\/1705.07761"},{"key":"e_1_3_3_1_26_2","unstructured":"Zhicong Tang Tiankai Hang Shuyang Gu Dong Chen and Baining Guo. 2024. Simplified Diffusion Schr\u00f6dinger Bridge. arxiv:https:\/\/arXiv.org\/abs\/2403.14623\u00a0[cs.LG] https:\/\/arxiv.org\/abs\/2403.14623"},{"key":"e_1_3_3_1_27_2","volume-title":"Advances in Neural Information Processing Systems","author":"Vaswani Ashish","year":"2017","unstructured":"Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan\u00a0N Gomez, \u0141\u00a0ukasz Kaiser, and Illia Polosukhin. 2017. Attention is All you Need. In Advances in Neural Information Processing Systems , I.\u00a0Guyon, U.\u00a0Von Luxburg, S.\u00a0Bengio, H.\u00a0Wallach, R.\u00a0Fergus, S.\u00a0Vishwanathan, and R.\u00a0Garnett (Eds.), Vol.\u00a030. Curran Associates, Inc.https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2017\/file\/3f5ee243547dee91fbd053c1c4a845aa-Paper.pdf"},{"key":"e_1_3_3_1_28_2","unstructured":"Jin Wang Yao Lai Aoxue Li Shifeng Zhang Jiacheng Sun Ning Kang Chengyue Wu Zhenguo Li and Ping Luo. 2025. FUDOKI: Discrete Flow-based Unified Understanding and Generation via Kinetic-Optimal Velocities. (2025). arxiv:https:\/\/arXiv.org\/abs\/2505.20147\u00a0[cs.CV] https:\/\/arxiv.org\/abs\/2505.20147"},{"key":"e_1_3_3_1_29_2","unstructured":"Chengyue Wu Xiaokang Chen Zhiyu Wu Yiyang Ma Xingchao Liu Zizheng Pan Wen Liu Zhenda Xie Xingkai Yu Chong Ruan et\u00a0al. 2024. Janus: Decoupling visual encoding for unified multimodal understanding and generation. arXiv preprint arXiv:https:\/\/arXiv.org\/abs\/2410.13848 (2024)."},{"key":"e_1_3_3_1_30_2","unstructured":"Zhilin Yang Zihang Dai Yiming Yang Jaime Carbonell Russ\u00a0R Salakhutdinov and Quoc\u00a0V Le. 2019. XLNet: Generalized Autoregressive Pretraining for Language Understanding. Advances in neural information processing systems 32 (2019)."},{"key":"e_1_3_3_1_31_2","unstructured":"Lantao Yu Weinan Zhang Jun Wang and Yong Yu. 2017. SeqGAN: Sequence Generative Adversarial Nets with Policy Gradient. arxiv:https:\/\/arXiv.org\/abs\/1609.05473\u00a0[cs.LG] https:\/\/arxiv.org\/abs\/1609.05473"},{"key":"e_1_3_3_1_32_2","unstructured":"Lin Zheng Jianbo Yuan Lei Yu and Lingpeng Kong. 2024. A Reparameterized Discrete Diffusion Model for Text Generation. arxiv:https:\/\/arXiv.org\/abs\/2302.05737\u00a0[cs.CL] https:\/\/arxiv.org\/abs\/2302.05737"}],"event":{"name":"ICAIF '25: 6th ACM International Conference on AI in Finance","location":"Singapore Singapore","acronym":"ICAIF '25"},"container-title":["Proceedings of the 6th ACM International Conference on AI in Finance"],"original-title":[],"deposited":{"date-parts":[[2025,11,14]],"date-time":"2025-11-14T07:31:36Z","timestamp":1763105496000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3768292.3770442"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,14]]},"references-count":31,"alternative-id":["10.1145\/3768292.3770442","10.1145\/3768292"],"URL":"https:\/\/doi.org\/10.1145\/3768292.3770442","relation":{},"subject":[],"published":{"date-parts":[[2025,11,14]]},"assertion":[{"value":"2025-11-14","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}