{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T20:33:20Z","timestamp":1776890000588,"version":"3.51.2"},"reference-count":41,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,1,1]],"date-time":"2022-01-01T00:00:00Z","timestamp":1640995200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100010665","name":"H2020 Marie Skłodowska-Curie Actions","doi-asserted-by":"publisher","award":["765068"],"award-info":[{"award-number":["765068"]}],"id":[{"id":"10.13039\/100010665","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Signal Process. 
Lett."],"published-print":{"date-parts":[[2022]]},"DOI":"10.1109\/lsp.2021.3135192","type":"journal-article","created":{"date-parts":[[2021,12,14]],"date-time":"2021-12-14T20:37:15Z","timestamp":1639514235000},"page":"344-348","source":"Crossref","is-referenced-by-count":6,"title":["A Convolutional-Attentional Neural Framework for Structure-Aware Performance-Score Synchronization"],"prefix":"10.1109","volume":"29","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3609-9589","authenticated-orcid":false,"given":"Ruchit","family":"Agrawal","sequence":"first","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]},{"given":"Daniel","family":"Wolff","sequence":"additional","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6098-481X","authenticated-orcid":false,"given":"Simon","family":"Dixon","sequence":"additional","affiliation":[],"role":[{"role":"author","vocab":"crossref"}]}],"member":"263","reference":[{"key":"ref1","first-page":"1727","article-title":"An on-line time warping algorithm for tracking musical performances","volume-title":"Proc. Int. Joint Conf. Artif. Intell.","author":"Dixon","year":"2005"},{"key":"ref2","doi-asserted-by":"crossref","DOI":"10.1007\/978-3-319-21945-5","volume-title":"Fundamentals of Music Processing: Audio, Analysis, Algorithms, Applications","author":"Müller","year":"2015"},{"key":"ref3","first-page":"784","article-title":"Learning to listen, read, and follow: Score following as a reinforcement learning game","volume-title":"Proc. Int. Soc. Music Inf. Retrieval Conf.","author":"Dorfer","year":"2018"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9414049"},{"key":"ref5","first-page":"115","article-title":"Learning audio-sheet music correspondences for score identification and offline alignment","volume-title":"Proc. 18th Int. Soc. Music Inf. 
Retrieval Conf.","author":"Dorfer","year":"2017"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.23919\/Eusipco47968.2020.9287625"},{"key":"ref7","first-page":"68","article-title":"Stand-alone self-attention in vision models","volume-title":"Proc. 33rd Conf. Neural Inf. Process. Syst.","author":"Ramachandran","year":"2019"},{"key":"ref8","first-page":"894","article-title":"Soft-DTW: A differentiable loss function for time-series","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Cuturi","year":"2017"},{"key":"ref9","first-page":"365","article-title":"Towards an efficient algorithm for automatic score-to-audio synchronization","volume-title":"Proc. Int. Conf. Music Inf. Retrieval","author":"Müller","year":"2004"},{"key":"ref10","first-page":"192","article-title":"An efficient multiscale approach to audio synchronization","volume-title":"Proc. Int. Conf. Music Inf. Retrieval","author":"Müller","year":"2006"},{"key":"ref11","first-page":"241","article-title":"Automatic page turning for musicians via real-time machine listening","volume-title":"Proc. 18th Eur. Conf. Artif. Intell.","author":"Arzt","year":"2008"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2005.1415694"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2011.5946371"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/MLSP.2014.6958908"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2015-667"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-642-02518-1_10"},{"key":"ref17","first-page":"2286","article-title":"Canonical time warping for alignment of human behavior","volume":"22","author":"Zhou","year":"2009","journal-title":"Ad. Neural Inf. Process. Syst."},{"key":"ref18","first-page":"24","article-title":"Towards effective any-time music tracking","volume-title":"Proc. 
5th Starting AI Researchers Symp.","author":"Arzt","year":"2010"},{"key":"ref19","first-page":"742","article-title":"An audio to score alignment framework using spectral factorization and dynamic time warping","volume-title":"Proc. Int. Soc. Music Inf. Retrieval Conf.","author":"Carabias-Orti","year":"2015"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA.2016.0142"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2016.2598318"},{"key":"ref22","article-title":"A hybrid approach to audio-to-score alignment","volume-title":"Proc. Mach. Learn. Media Discov. Workshop Int. Conf. Mach. Learn.","author":"Agrawal","year":"2019"},{"key":"ref23","first-page":"91","article-title":"MIDI-sheet music alignment using bootleg score synthesis","volume-title":"Proc. Int. Soc. Music Inf. Retrieval","author":"Tanprasert","year":"2019"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2710047"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00912"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9054121"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.5334\/tismir.12"},{"key":"ref28","first-page":"780","article-title":"Learning to read and follow music in complete score sheet images","volume-title":"Proc. 21th Int. Soc. Music Inf. Retrieval Conf.","author":"Henkel","year":"2020"},{"key":"ref29","article-title":"Audio-conditioned U-Net for position estimation in full sheet images","volume-title":"Proc. Int. Workshop Reading Music Syst.","author":"Henkel","year":"2019"},{"key":"ref30","first-page":"243","article-title":"Handling repeats and jumps in score-performance synchronization","volume-title":"Proc. Int. Soc. Music Inf. Retrieval Conf.","author":"Fremerey","year":"2010"},{"key":"ref31","first-page":"607","article-title":"Automatic alignment of music performances with structural differences","volume-title":"Proc. 14th Int. Soc. Music Inf. 
Retrieval Conf.","author":"Grachten","year":"2013"},{"key":"ref32","first-page":"6000","article-title":"Attention is all you need","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Vaswani","year":"2017"},{"key":"ref33","article-title":"Attention U-net: Learning where to look for the pancreas","volume-title":"Proc. 1st Conf. Med. Imag. With Deep Learn.","author":"Oktay","year":"2018"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10590-1_53"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.23915\/distill.00003"},{"key":"ref36","first-page":"3853","article-title":"Differentiable divergences between time series","volume-title":"Proc. Int. Conf. Artif. Intell. Statist.","author":"Blondel","year":"2021"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.25080\/majora-7b98e3ed-003"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/s13398-014-0173-7.2"},{"key":"ref39","first-page":"85","article-title":"Mazurka-BL: Score-aligned loudness, beat, expressive markings data for 2000 Chopin mazurka recordings","volume-title":"Proc. 4th Int. Conf. Technol. Music Notation Representation","author":"Kosta","year":"2018"},{"key":"ref40","first-page":"315","article-title":"Evaluation of real-time audio-to-score alignment","volume-title":"Proc. Int. Conf. Music Inf. 
Retrieval","author":"Cont","year":"2007"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1016\/S0169-2070(96)00719-4"}],"container-title":["IEEE Signal Processing Letters"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/97\/9686799\/09650716.pdf?arnumber=9650716","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,1,10]],"date-time":"2024-01-10T00:31:12Z","timestamp":1704846672000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9650716\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022]]},"references-count":41,"URL":"https:\/\/doi.org\/10.1109\/lsp.2021.3135192","relation":{},"ISSN":["1070-9908","1558-2361"],"issn-type":[{"value":"1070-9908","type":"print"},{"value":"1558-2361","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022]]}}}