{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,17]],"date-time":"2026-06-17T16:37:12Z","timestamp":1781714232495,"version":"3.54.5"},"reference-count":39,"publisher":"IEEE","license":[{"start":{"date-parts":[[2024,9,9]],"date-time":"2024-09-09T00:00:00Z","timestamp":1725840000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2024,9,9]],"date-time":"2024-09-09T00:00:00Z","timestamp":1725840000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024,9,9]]},"DOI":"10.1109\/iwaenc61483.2024.10694313","type":"proceedings-article","created":{"date-parts":[[2024,10,4]],"date-time":"2024-10-04T17:31:16Z","timestamp":1728063076000},"page":"205-209","source":"Crossref","is-referenced-by-count":24,"title":["TF-Locoformer: Transformer with Local Modeling by Convolution for Speech Separation and Enhancement"],"prefix":"10.1109","author":[{"given":"Kohei","family":"Saijo","sequence":"first","affiliation":[{"name":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Gordon","family":"Wichern","sequence":"additional","affiliation":[{"name":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Fran\u00e7ois G.","family":"Germain","sequence":"additional","affiliation":[{"name":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Zexu","family":"Pan","sequence":"additional","affiliation":[{"name":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Jonathan Le","family":"Roux","sequence":"additional","affiliation":[{"name":"Mitsubishi Electric Research Laboratories (MERL),Cambridge,MA,USA"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2016.7471631"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2019.2915167"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9054266"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-2205"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP39728.2021.9413901"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9747554"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2023.3304482"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/IWAENC53105.2022.9914794"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.5555\/3295222.3295349"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2022-700"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/icassp48485.2024.10445985"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU46091.2019.9003750"},{"key":"ref13","article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","volume-title":"Proc. ICLR","author":"Dosovitskiy"},{"key":"ref14","article-title":"Robust speech recognition via large-scale weak supervision","volume-title":"Proc. ICML","author":"Radford"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/ASRU57964.2023.10389733"},{"key":"ref16","article-title":"Scaling laws for neural language models","author":"Kaplan","year":"2020"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2021-1644"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01179"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2020-3015"},{"key":"ref20","article-title":"Understanding and improving transformer from a multi-particle dynamic system point of view","volume-title":"ICLR 2020 Workshop on Integration of Deep Neural Models and Differential Equations","author":"Lu"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1016\/j.neucom.2023.127063"},{"key":"ref22","article-title":"GLU variants improve Transformer","author":"Shazeer","year":"2020"},{"key":"ref23","article-title":"Root mean square layer normalization","volume-title":"Proc. NeurIPS","author":"Zhang"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01261-8_1"},{"key":"ref25","article-title":"LibriMix: An open-source dataset for generalizable speech separation","author":"Cosentino","year":"2020"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9053327"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2020-3038"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2015.7178964"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/SLT48900.2021.9383615"},{"key":"ref30","article-title":"Decoupled weight decay regularization","volume-title":"Proc. ICLR","author":"Loshchilov"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2017.7952154"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/icassp.2019.8683855"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9747146"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TSA.2005.858005"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/TASL.2011.2114881"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2001.941023"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2021.3099291"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP48485.2024.10446032"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.21437\/Interspeech.2023-339"}],"event":{"name":"2024 18th International Workshop on Acoustic Signal Enhancement (IWAENC)","location":"Aalborg, Denmark","start":{"date-parts":[[2024,9,9]]},"end":{"date-parts":[[2024,9,12]]}},"container-title":["2024 18th International Workshop on Acoustic Signal Enhancement (IWAENC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10693863\/10693957\/10694313.pdf?arnumber=10694313","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,5]],"date-time":"2024-10-05T07:38:00Z","timestamp":1728113880000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10694313\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,9,9]]},"references-count":39,"URL":"https:\/\/doi.org\/10.1109\/iwaenc61483.2024.10694313","relation":{},"subject":[],"published":{"date-parts":[[2024,9,9]]}}}