{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,7]],"date-time":"2026-01-07T08:09:54Z","timestamp":1767773394527,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":53,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,11,25]],"date-time":"2023-11-25T00:00:00Z","timestamp":1700870400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,11,27]]},"DOI":"10.1145\/3604237.3626841","type":"proceedings-article","created":{"date-parts":[[2023,11,25]],"date-time":"2023-11-25T18:09:47Z","timestamp":1700935787000},"page":"124-132","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":5,"title":["SigFormer: Signature Transformers for Deep Hedging"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0008-2494-0044","authenticated-orcid":false,"given":"Anh","family":"Tong","sequence":"first","affiliation":[{"name":"Graduate School of AI, KAIST, KR"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1917-2190","authenticated-orcid":false,"given":"Thanh","family":"Nguyen-Tang","sequence":"additional","affiliation":[{"name":"Johns Hopkins University, US"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3306-1566","authenticated-orcid":false,"given":"Dongeun","family":"Lee","sequence":"additional","affiliation":[{"name":"Texas A&amp;M University-Commerce, US"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7182-7548","authenticated-orcid":false,"given":"Toan M","family":"Tran","sequence":"additional","affiliation":[{"name":"VinAI Research, VN"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4663-3263","authenticated-orcid":false,"given":"Jaesik","family":"Choi","sequence":"additional","affiliation":[{"name":"Graduate School of AI, KAIST\/INEEJI, KR"}]}],"member":"320","published-online":{"date-parts":[[2023,11,25]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/3383455.3422553"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"crossref","unstructured":"Alvaro Arroyo Alvaro Cartea Fernando Moreno-Pino and Stefan Zohren. 2023. Deep Attentive Survival Analysis in Limit Order Books: Estimating Fill Probabilities with Convolutional-Transformers. arxiv:2306.05479\u00a0[q-fin.ST]","DOI":"10.2139\/ssrn.4432087"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"crossref","unstructured":"Fazl Barez Paul Bilokon Arthur Gervais and Nikita Lisitsyn. 2023. Exploring the Advantages of Transformers for High-Frequency Trading. arxiv:2302.13850\u00a0[q-fin.ST]","DOI":"10.2139\/ssrn.4364833"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1080\/14697688.2015.1099717"},{"key":"e_1_3_2_1_5_1","unstructured":"Christian Bayer and Benjamin Stemper. 2018. Deep calibration of rough stochastic volatility models. arxiv:1810.03399\u00a0[q-fin.PR]"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00780-017-0335-5"},{"key":"e_1_3_2_1_7_1","unstructured":"James Bradbury Roy Frostig Peter Hawkins Matthew\u00a0James Johnson Chris Leary Dougal Maclaurin George Necula Adam Paszke Jake VanderPlas Skye Wanderman-Milne and Qiao Zhang. 2018. JAX: composable transformations of Python+NumPy programs. http:\/\/github.com\/google\/jax"},{"key":"e_1_3_2_1_8_1","volume-title":"Language models are few-shot learners. Advances in neural information processing systems 33","author":"Brown Tom","year":"2020","unstructured":"Tom Brown, Benjamin Mann, Nick Ryder, Melanie Subbiah, Jared\u00a0D Kaplan, Prafulla Dhariwal, Arvind Neelakantan, Pranav Shyam, Girish Sastry, Amanda Askell, 2020. Language models are few-shot learners. Advances in neural information processing systems 33 (2020), 1877\u20131901."},{"key":"e_1_3_2_1_9_1","volume-title":"Lecture Notes Learning to Trade I: Statistical Hedging. Lecture Notes Learning to Trade I: Statistical Hedging (June 30","author":"Buehler Hans","year":"2022","unstructured":"Hans Buehler and Blanka Horvath. 2022. Lecture Notes Learning to Trade I: Statistical Hedging. Lecture Notes Learning to Trade I: Statistical Hedging (June 30, 2022) (2022)."},{"key":"e_1_3_2_1_10_1","volume-title":"Lecture Notes Learning to Trade II: Deep Hedging. Lecture Notes Learning to Trade II: Deep Hedging (June 30","author":"Buehler Hans","year":"2022","unstructured":"Hans Buehler and Blanka Horvath. 2022. Lecture Notes Learning to Trade II: Deep Hedging. Lecture Notes Learning to Trade II: Deep Hedging (June 30, 2022) (2022)."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"crossref","unstructured":"Hans B\u00fchler Lukas Gonon Josef Teichmann and Ben Wood. 2018. Deep Hedging.","DOI":"10.2139\/ssrn.3120710"},{"key":"e_1_3_2_1_12_1","volume-title":"Deep Hedging: Learning to Remove the Drift under Trading Frictions with Minimal Equivalent Near-Martingale Measures. arxiv:2111.07844\u00a0[q-fin.CP]","author":"B\u00fchler Hans","year":"2022","unstructured":"Hans B\u00fchler, Phillip Murray, Mikko\u00a0S. Pakkanen, and Ben Wood. 2022. Deep Hedging: Learning to Remove the Drift under Trading Frictions with Minimal Equivalent Near-Martingale Measures. arxiv:2111.07844\u00a0[q-fin.CP]"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"crossref","unstructured":"Hans B\u00fchler Phillip Murray and Ben Wood. 2023. Deep Bellman Hedging. arxiv:2207.00932\u00a0[q-fin.CP]","DOI":"10.2139\/ssrn.4151026"},{"key":"e_1_3_2_1_14_1","volume-title":"Decision transformer: Reinforcement learning via sequence modeling. Advances in neural information processing systems 34","author":"Chen Lili","year":"2021","unstructured":"Lili Chen, Kevin Lu, Aravind Rajeswaran, Kimin Lee, Aditya Grover, Misha Laskin, Pieter Abbeel, Aravind Srinivas, and Igor Mordatch. 2021. Decision transformer: Reinforcement learning via sequence modeling. Advances in neural information processing systems 34 (2021), 15084\u201315097."},{"key":"e_1_3_2_1_15_1","unstructured":"Ilya Chevyrev and Andrey Kormilitzin. 2016. A Primer on the Signature Method in Machine Learning."},{"key":"e_1_3_2_1_16_1","volume-title":"An image is worth 16x16 words: Transformers for image recognition at scale. arXiv preprint arXiv:2010.11929","author":"Dosovitskiy Alexey","year":"2020","unstructured":"Alexey Dosovitskiy, Lucas Beyer, Alexander Kolesnikov, Dirk Weissenborn, Xiaohua Zhai, Thomas Unterthiner, Mostafa Dehghani, Matthias Minderer, Georg Heigold, Sylvain Gelly, 2020. An image is worth 16x16 words: Transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)."},{"volume-title":"A Course on Rough Paths: With an Introduction to Regularity Structures","author":"Friz K","key":"e_1_3_2_1_17_1","unstructured":"Peter\u00a0K Friz and Martin Hairer. 2020. A Course on Rough Paths: With an Introduction to Regularity Structures. Springer Nature."},{"volume-title":"Multidimensional stochastic processes as rough paths: theory and applications. Vol.\u00a0120","author":"Friz K","key":"e_1_3_2_1_18_1","unstructured":"Peter\u00a0K Friz and Nicolas\u00a0B Victoir. 2010. Multidimensional stochastic processes as rough paths: theory and applications. Vol.\u00a0120. Cambridge University Press."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"crossref","unstructured":"Jim Gatheral Thibault Jaisson and Mathieu Rosenbaum. 2014. Volatility is rough. arxiv:1410.3394\u00a0[q-fin.ST]","DOI":"10.2139\/ssrn.2509457"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"crossref","unstructured":"Mor Geva Roei Schuster Jonathan Berant and Omer Levy. 2021. Transformer Feed-Forward Layers Are Key-Value Memories. arxiv:2012.14913\u00a0[cs.CL]","DOI":"10.18653\/v1\/2021.emnlp-main.446"},{"key":"e_1_3_2_1_21_1","volume-title":"A closed-form solution for options with stochastic volatility with applications to bond and currency options. The review of financial studies 6, 2","author":"Heston L","year":"1993","unstructured":"Steven\u00a0L Heston. 1993. A closed-form solution for options with stochastic volatility with applications to bond and currency options. The review of financial studies 6, 2 (1993), 327\u2013343."},{"key":"e_1_3_2_1_22_1","volume-title":"Multilayer feedforward networks are universal approximators. Neural networks 2, 5","author":"Hornik Kurt","year":"1989","unstructured":"Kurt Hornik, Maxwell Stinchcombe, and Halbert White. 1989. Multilayer feedforward networks are universal approximators. Neural networks 2, 5 (1989), 359\u2013366."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"crossref","unstructured":"Blanka Horvath Josef Teichmann and Zan Zuric. 2021. Deep Hedging under Rough Volatility.","DOI":"10.2139\/ssrn.3778043"},{"key":"e_1_3_2_1_24_1","volume-title":"Optimal static-dynamic hedges for exotic options under convex risk measures. Stochastic Processes and their Applications 119, 10","author":"Ilhan Ayta\u00e7","year":"2009","unstructured":"Ayta\u00e7 Ilhan, Mattias Jonsson, and Ronnie Sircar. 2009. Optimal static-dynamic hedges for exotic options under convex risk measures. Stochastic Processes and their Applications 119, 10 (2009), 3608\u20133632."},{"key":"e_1_3_2_1_25_1","unstructured":"Patrick Kidger Patric Bonnier Imanol Perez\u00a0Arribas Cristopher Salvi and Terry Lyons. 2019. Deep Signature Transforms. In Advances in Neural Information Processing Systems H.\u00a0Wallach H.\u00a0Larochelle A.\u00a0Beygelzimer F.\u00a0d'Alch\u00e9-Buc E.\u00a0Fox and R.\u00a0Garnett (Eds.). 3099\u20133109."},{"key":"e_1_3_2_1_26_1","volume-title":"International Conference on Learning Representations.","author":"Kidger Patrick","year":"2021","unstructured":"Patrick Kidger and Terry Lyons. 2021. Signatory: differentiable computations of the signature and logsignature transforms, on both CPU and GPU. In International Conference on Learning Representations."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1412.6980"},{"key":"e_1_3_2_1_28_1","first-page":"1","article-title":"Kernels for Sequentially Ordered Data","volume":"20","author":"Kiraly J.","year":"2019","unstructured":"Franz\u00a0J. Kiraly and Harald Oberhauser. 2019. Kernels for Sequentially Ordered Data. Journal of Machine Learning Research 20, 31 (2019), 1\u201345.","journal-title":"Journal of Machine Learning Research"},{"key":"e_1_3_2_1_29_1","unstructured":"Damian Kisiel and Denise Gorse. 2022. Portfolio Transformer for Attention-Based Asset Allocation. arxiv:2206.03246\u00a0[q-fin.PM]"},{"key":"e_1_3_2_1_30_1","unstructured":"Shiyang Li Xiaoyong Jin Yao Xuan Xiyou Zhou Wenhu Chen Yu-Xiang Wang and Xifeng Yan. 2020. Enhancing the Locality and Breaking the Memory Bottleneck of Transformer on Time Series Forecasting. arxiv:1907.00235\u00a0[cs.LG]"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"crossref","unstructured":"Yannick Limmer and Blanka Horvath. 2023. Robust Hedging GANs. arxiv:2307.02310\u00a0[q-fin.CP]","DOI":"10.2139\/ssrn.4489029"},{"key":"e_1_3_2_1_32_1","volume-title":"Rough paths, Signatures and the modelling of functions on streams. arXiv: Probability","author":"Lyons Terry","year":"2014","unstructured":"Terry Lyons. 2014. Rough paths, Signatures and the modelling of functions on streams. arXiv: Probability (2014)."},{"key":"e_1_3_2_1_33_1","unstructured":"Terry Lyons and Andrew\u00a0D. McLeod. 2023. Signature Methods in Machine Learning. arxiv:2206.14674\u00a0[stat.ML]"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"crossref","unstructured":"Terry Lyons Sina Nejad and Imanol\u00a0Perez Arribas. 2019. Nonparametric pricing and hedging of exotic derivatives.","DOI":"10.1080\/1350486X.2021.1891555"},{"key":"e_1_3_2_1_35_1","volume-title":"Differential equations driven by rough signals.Revista Matem\u00e1tica Iberoamericana 14, 2","author":"Lyons J.","year":"1998","unstructured":"Terry\u00a0J. Lyons. 1998. Differential equations driven by rough signals.Revista Matem\u00e1tica Iberoamericana 14, 2 (1998), 215\u2013310."},{"key":"e_1_3_2_1_36_1","series-title":"SIAM review 10, 4","volume-title":"Fractional Brownian motions, fractional noises and applications","author":"Mandelbrot B","year":"1968","unstructured":"Benoit\u00a0B Mandelbrot and John\u00a0W Van\u00a0Ness. 1968. Fractional Brownian motions, fractional noises and applications. SIAM review 10, 4 (1968), 422\u2013437."},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1080\/14697688.2018.1459812"},{"key":"e_1_3_2_1_38_1","unstructured":"James Morrill Adeline Fermanian Patrick Kidger and Terry Lyons. 2021. A Generalised Signature Method for Multivariate Time Series Feature Extraction. arxiv:2006.00873\u00a0[cs.LG]"},{"key":"e_1_3_2_1_39_1","unstructured":"James Morrill Cristopher Salvi Patrick Kidger James Foster and Terry Lyons. 2021. Neural Rough Differential Equations for Long Time Series. arxiv:2009.08295\u00a0[cs.LG]"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i10.17104"},{"key":"e_1_3_2_1_41_1","volume-title":"Composable Effects for Flexible and Accelerated Probabilistic Programming in NumPyro. arXiv preprint arXiv:1912.11554","author":"Phan Du","year":"2019","unstructured":"Du Phan, Neeraj Pradhan, and Martin Jankowiak. 2019. Composable Effects for Flexible and Accelerated Probabilistic Programming in NumPyro. arXiv preprint arXiv:1912.11554 (2019)."},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1017\/S0962492900002919"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1145\/3371237"},{"key":"e_1_3_2_1_44_1","series-title":"SIAM Journal on Mathematics of Data Science (jan","volume-title":"The Signature Kernel Is the Solution of a Goursat PDE","author":"Salvi Cristopher","year":"2021","unstructured":"Cristopher Salvi, Thomas Cass, James Foster, Terry Lyons, and Weixin Yang. 2021. The Signature Kernel Is the Solution of a Goursat PDE. SIAM Journal on Mathematics of Data Science (jan 2021), 873\u2013899."},{"key":"e_1_3_2_1_45_1","volume-title":"Learning Fractional White Noises in Neural Stochastic Differential Equations. In Thirty-Sixth Conference on Neural Information Processing Systems (NeurIPS). https:\/\/openreview.net\/forum?id=lTZBRxm2q5","author":"Tong Anh","year":"2022","unstructured":"Anh Tong, Thanh Nguyen-Tang, Toan Tran, and Jaesik Choi. 2022. Learning Fractional White Noises in Neural Stochastic Differential Equations. In Thirty-Sixth Conference on Neural Information Processing Systems (NeurIPS). https:\/\/openreview.net\/forum?id=lTZBRxm2q5"},{"key":"e_1_3_2_1_46_1","unstructured":"Ashish Vaswani Noam Shazeer Niki Parmar Jakob Uszkoreit Llion Jones Aidan\u00a0N. Gomez Lukasz Kaiser and Illia Polosukhin. 2017. Attention is All you Need. In NeurIPS."},{"key":"e_1_3_2_1_47_1","unstructured":"Qingsong Wen Tian Zhou Chaoli Zhang Weiqi Chen Ziqing Ma Junchi Yan and Liang Sun. 2023. Transformers in Time Series: A Survey. arxiv:2202.07125\u00a0[cs.LG]"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.2307\/2331288"},{"key":"e_1_3_2_1_49_1","volume-title":"Autoformer: Decomposition Transformers with Auto-Correlation for Long-Term Series Forecasting. arxiv:2106.13008\u00a0[cs.LG]","author":"Wu Haixu","year":"2022","unstructured":"Haixu Wu, Jiehui Xu, Jianmin Wang, and Mingsheng Long. 2022. Autoformer: Decomposition Transformers with Auto-Correlation for Long-Term Series Forecasting. arxiv:2106.13008\u00a0[cs.LG]"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10436-005-0023-x"},{"key":"e_1_3_2_1_51_1","doi-asserted-by":"crossref","unstructured":"Ailing Zeng Muxi Chen Lei Zhang and Qiang Xu. 2023. Are Transformers Effective for Time Series Forecasting?Proceedings of the AAAI Conference on Artificial Intelligence.","DOI":"10.1609\/aaai.v37i9.26317"},{"key":"e_1_3_2_1_52_1","volume-title":"Informer: Beyond Efficient Transformer for Long Sequence Time-Series Forecasting. arxiv:2012.07436\u00a0[cs.LG]","author":"Zhou Haoyi","year":"2021","unstructured":"Haoyi Zhou, Shanghang Zhang, Jieqi Peng, Shuai Zhang, Jianxin Li, Hui Xiong, and Wancai Zhang. 2021. Informer: Beyond Efficient Transformer for Long Sequence Time-Series Forecasting. arxiv:2012.07436\u00a0[cs.LG]"},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.3390\/fractalfract7030225"}],"event":{"name":"ICAIF '23: 4th ACM International Conference on AI in Finance","acronym":"ICAIF '23","location":"Brooklyn NY USA"},"container-title":["4th ACM International Conference on AI in Finance"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3604237.3626841","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3604237.3626841","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T17:36:35Z","timestamp":1755884195000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3604237.3626841"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,11,25]]},"references-count":53,"alternative-id":["10.1145\/3604237.3626841","10.1145\/3604237"],"URL":"https:\/\/doi.org\/10.1145\/3604237.3626841","relation":{},"subject":[],"published":{"date-parts":[[2023,11,25]]},"assertion":[{"value":"2023-11-25","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}