{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,13]],"date-time":"2026-04-13T21:23:36Z","timestamp":1776115416889,"version":"3.50.1"},"reference-count":37,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T00:00:00Z","timestamp":1777593600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T00:00:00Z","timestamp":1777593600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T00:00:00Z","timestamp":1777593600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T00:00:00Z","timestamp":1777593600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T00:00:00Z","timestamp":1777593600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T00:00:00Z","timestamp":1777593600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T00:00:00Z","timestamp":1777593600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/100012541","name":"Guangdong Innovative and Entrepreneurial Research Team Program","doi-asserted-by":"publisher","award":["2023ZT10X044"],"award-info":[{"award-number":["2023ZT10X044"]}],"id":[{"id":"10.13039\/100012541","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001659","name":"Deutsche Forschungsgemeinschaft","doi-asserted-by":"publisher","award":["EXC 2077"],"award-info":[{"award-number":["EXC 2077"]}],"id":[{"id":"10.13039\/501100001659","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100007837","name":"Universit\u00e4t Bremen","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100007837","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62271432"],"award-info":[{"award-number":["62271432"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Pattern Recognition Letters"],"published-print":{"date-parts":[[2026,5]]},"DOI":"10.1016\/j.patrec.2026.03.005","type":"journal-article","created":{"date-parts":[[2026,3,9]],"date-time":"2026-03-09T09:33:17Z","timestamp":1773048797000},"page":"146-151","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"C","title":["The effect of speech representations on EEG-based auditory attention detection"],"prefix":"10.1016","volume":"203","author":[{"ORCID":"https:\/\/orcid.org\/0009-0002-5261-8091","authenticated-orcid":false,"given":"Haoqi","family":"Hu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6069-4284","authenticated-orcid":false,"given":"Yuan","family":"Liao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3282-9246","authenticated-orcid":false,"given":"Siqi","family":"Cai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9158-9401","authenticated-orcid":false,"given":"Haizhou","family":"Li","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"78","reference":[{"issue":"7","key":"10.1016\/j.patrec.2026.03.005_bib0001","doi-asserted-by":"crossref","first-page":"1697","DOI":"10.1093\/cercor\/bht355","article-title":"Attentional selection in a cocktail party environment can be decoded from single-trial EEG","volume":"25","author":"O\u2019sullivan","year":"2015","journal-title":"Cereb. Cortex"},{"issue":"3","key":"10.1016\/j.patrec.2026.03.005_bib0002","doi-asserted-by":"crossref","DOI":"10.1561\/116.00000128","article-title":"EEG-based auditory attention detection in cocktail party environment","volume":"12","author":"Cai","year":"2023","journal-title":"APSIPA Trans. Signal Inf. Process."},{"issue":"2","key":"10.1016\/j.patrec.2026.03.005_bib0003","doi-asserted-by":"crossref","first-page":"256","DOI":"10.1109\/THMS.2021.3125283","article-title":"EEG-based auditory attention detection via frequency and channel neural attention","volume":"52","author":"Cai","year":"2021","journal-title":"IEEE Trans. Hum. Mach. Syst."},{"key":"10.1016\/j.patrec.2026.03.005_bib0004","doi-asserted-by":"crossref","first-page":"28","DOI":"10.1016\/j.patrec.2023.10.011","article-title":"A jackknife-inspired deep learning approach to subject-independent classification of EEG","volume":"176","author":"Dolzhikova","year":"2023","journal-title":"Pattern Recognit. Lett."},{"key":"10.1016\/j.patrec.2026.03.005_bib0005","doi-asserted-by":"crossref","first-page":"57","DOI":"10.1016\/j.patrec.2025.09.011","article-title":"Toward interpretable schizophrenia detection from EEG using autoencoder and EfficientNet","volume":"198","author":"Mudavath","year":"2025","journal-title":"Pattern Recognit. Lett."},{"key":"10.1016\/j.patrec.2026.03.005_bib0006","doi-asserted-by":"crossref","first-page":"153","DOI":"10.3389\/fnins.2019.00153","article-title":"A tutorial on auditory attention identification methods","volume":"13","author":"Alickovic","year":"2019","journal-title":"Front. Neurosci."},{"issue":"7","key":"10.1016\/j.patrec.2026.03.005_bib0007","doi-asserted-by":"crossref","first-page":"2233","DOI":"10.1109\/TBME.2022.3140246","article-title":"STANet: a spatiotemporal attention network for decoding auditory spatial attention from EEG","volume":"69","author":"Su","year":"2022","journal-title":"IEEE Trans. Biomed. Eng."},{"issue":"1","key":"10.1016\/j.patrec.2026.03.005_bib0008","doi-asserted-by":"crossref","DOI":"10.1038\/s41598-021-94876-0","article-title":"Dynamic selective auditory attention detection using RNN and reinforcement learning","volume":"11","author":"Geravanchizadeh","year":"2021","journal-title":"Sci. Rep."},{"issue":"12","key":"10.1016\/j.patrec.2026.03.005_bib0009","doi-asserted-by":"crossref","first-page":"17387","DOI":"10.1109\/TNNLS.2023.3303308","article-title":"A bio-inspired spiking attentional neural network for attentional selection in the listening brain","volume":"35","author":"Cai","year":"2024","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"key":"10.1016\/j.patrec.2026.03.005_bib0010","doi-asserted-by":"crossref","DOI":"10.3389\/fnins.2021.652058","article-title":"Auditory attention detection via cross-modal attention","volume":"15","author":"Cai","year":"2021","journal-title":"Front. Neurosci."},{"key":"10.1016\/j.patrec.2026.03.005_bib0011","first-page":"31688","article-title":"DARNet: dual attention refinement network with spatiotemporal construction for auditory attention detection","volume":"37","author":"Yan","year":"2024","journal-title":"Adv. Neural Inf. Process. Syst."},{"issue":"5","key":"10.1016\/j.patrec.2026.03.005_bib0012","doi-asserted-by":"crossref","first-page":"858","DOI":"10.1038\/s41593-023-01304-9","article-title":"Semantic reconstruction of continuous language from non-invasive brain recordings","volume":"26","author":"Tang","year":"2023","journal-title":"Nat. Neurosci."},{"issue":"5","key":"10.1016\/j.patrec.2026.03.005_bib0013","doi-asserted-by":"crossref","first-page":"1465","DOI":"10.3758\/s13414-015-0882-9","article-title":"The cocktail-party problem revisited: early processing and selection of multi-talker speech","volume":"77","author":"Bronkhorst","year":"2015","journal-title":"Attention, Percept. Psychophys."},{"key":"10.1016\/j.patrec.2026.03.005_bib0014","series-title":"ICASSP 2024-2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","first-page":"1241","article-title":"Investigating self-supervised deep representations for EEG-based auditory attention decoding","author":"Thakkar","year":"2024"},{"issue":"3","key":"10.1016\/j.patrec.2026.03.005_bib0015","doi-asserted-by":"crossref","first-page":"583","DOI":"10.1093\/cercor\/bhp124","article-title":"Auditory attentional control and selection during cocktail party listening","volume":"20","author":"Hill","year":"2010","journal-title":"Cereb. Cortex"},{"issue":"11","key":"10.1016\/j.patrec.2026.03.005_bib0016","doi-asserted-by":"crossref","first-page":"4126","DOI":"10.1093\/cercor\/bhu131","article-title":"Impaired facilitatory mechanisms of auditory attention after damage of the lateral prefrontal cortex","volume":"25","author":"Bidet-Caulet","year":"2015","journal-title":"Cereb. Cortex"},{"key":"10.1016\/j.patrec.2026.03.005_bib0017","doi-asserted-by":"crossref","DOI":"10.1016\/j.neulet.2023.137534","article-title":"Music-oriented auditory attention detection from electroencephalogram","volume":"818","author":"Niu","year":"2024","journal-title":"Neurosci. Lett."},{"issue":"5","key":"10.1016\/j.patrec.2026.03.005_bib0018","doi-asserted-by":"crossref","first-page":"402","DOI":"10.1109\/TNSRE.2016.2571900","article-title":"Auditory-inspired speech envelope extraction methods for improved EEG-based auditory attention detection in a cocktail party scenario","volume":"25","author":"Biesmans","year":"2016","journal-title":"IEEE Trans. Neural Syst. Rehabil. Eng."},{"key":"10.1016\/j.patrec.2026.03.005_bib0019","doi-asserted-by":"crossref","first-page":"304","DOI":"10.1016\/j.patrec.2025.08.010","article-title":"Zero-shot KWS for children\u2019s speech using layer-wise features from SSL models","volume":"197","author":"Kutum","year":"2025","journal-title":"Pattern Recognit. Lett."},{"key":"10.1016\/j.patrec.2026.03.005_bib0020","series-title":"2023 45th Annual International Conference of the IEEE Engineering in Medicine & Biology Society (EMBC)","first-page":"1","article-title":"Predicting EEG responses to attended speech via deep neural networks for speech","author":"Alickovic","year":"2023"},{"key":"10.1016\/j.patrec.2026.03.005_bib0021","series-title":"Proceedings of the AAAI Conference on Artificial Intelligence","first-page":"25697","article-title":"Codec does matter: exploring the semantic shortcoming of codec for audio language model","volume":"39","author":"Ye","year":"2025"},{"key":"10.1016\/j.patrec.2026.03.005_bib0022","doi-asserted-by":"crossref","DOI":"10.3389\/frai.2025.1502504","article-title":"Reconstructing signal during brain stimulation with stim-BERT: a self-supervised learning model trained on millions of iEEG files","volume":"8","author":"Menon","year":"2025","journal-title":"Front. Artif. Intell."},{"issue":"5","key":"10.1016\/j.patrec.2026.03.005_bib0023","doi-asserted-by":"crossref","first-page":"803","DOI":"10.1016\/j.cub.2018.01.080","article-title":"Electrophysiological correlates of semantic dissimilarity reflect the comprehension of natural, narrative speech","volume":"28","author":"Broderick","year":"2018","journal-title":"Current Biol."},{"issue":"4","key":"10.1016\/j.patrec.2026.03.005_bib0024","doi-asserted-by":"crossref","DOI":"10.1371\/journal.pcbi.1013006","article-title":"Dynamic modeling of EEG responses to natural speech reveals earlier processing of predictable words","volume":"21","author":"Dou","year":"2025","journal-title":"PLoS Comput. Biol."},{"key":"10.1016\/j.patrec.2026.03.005_bib0025","doi-asserted-by":"crossref","first-page":"799","DOI":"10.1109\/OJSP.2023.3340063","article-title":"Attention and sequence modeling for match-mismatch classification of speech stimulus and EEG response","volume":"5","author":"Borsdorf","year":"2023","journal-title":"IEEE Open J. Signal Process."},{"key":"10.1016\/j.patrec.2026.03.005_bib0026","series-title":"International Conference on Intelligent Computing","first-page":"177","article-title":"HERMES: heterogeneous mixture of experts based on segments for auditory attention decoding","author":"Ma","year":"2025"},{"issue":"3","key":"10.1016\/j.patrec.2026.03.005_bib0027","doi-asserted-by":"crossref","first-page":"423","DOI":"10.1007\/s10548-014-0354-x","article-title":"Brain dynamics of distractibility: interaction between top-down and bottom-up mechanisms of auditory attention","volume":"28","author":"Bidet-Caulet","year":"2015","journal-title":"Brain Topogr."},{"issue":"8","key":"10.1016\/j.patrec.2026.03.005_bib0028","doi-asserted-by":"crossref","first-page":"1941","DOI":"10.1016\/j.ymssp.2005.07.002","article-title":"A new envelope algorithm of Hilbert\u2013Huang transform","volume":"20","author":"Qin","year":"2006","journal-title":"Mech. Syst. Signal Process."},{"issue":"11","key":"10.1016\/j.patrec.2026.03.005_bib0029","doi-asserted-by":"crossref","first-page":"1558","DOI":"10.1109\/PROC.1977.10770","article-title":"A unified approach to short-time fourier analysis and synthesis","volume":"65","author":"Allen","year":"2005","journal-title":"Proc. IEEE"},{"key":"10.1016\/j.patrec.2026.03.005_bib0030","first-page":"12449","article-title":"Wav2vec 2.0: a framework for self-supervised learning of speech representations","volume":"33","author":"Baevski","year":"2020","journal-title":"Adv. Neural Inf. Process. Syst."},{"issue":"4","key":"10.1016\/j.patrec.2026.03.005_bib0031","doi-asserted-by":"crossref","first-page":"2924","DOI":"10.1109\/TPAMI.2025.3529038","article-title":"Few-shot class-incremental learning for classification and object detection: a survey","volume":"47","author":"Zhang","year":"2025","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"10.1016\/j.patrec.2026.03.005_bib0032","first-page":"1","article-title":"WP-FSCIL: a well-prepared few-shot class-incremental learning framework for pill recognition","author":"Zhang","year":"2025","journal-title":"IEEE J. Biomed. Health Inform."},{"issue":"5","key":"10.1016\/j.patrec.2026.03.005_bib0033","doi-asserted-by":"crossref","first-page":"1136","DOI":"10.1109\/JPROC.2012.2237151","article-title":"Spoken language recognition: from fundamentals to practice","volume":"101","author":"Li","year":"2013","journal-title":"Proc. IEEE"},{"key":"10.1016\/j.patrec.2026.03.005_bib0034","series-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers)","first-page":"4171","article-title":"Bert: pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2019"},{"key":"10.1016\/j.patrec.2026.03.005_bib0035","series-title":"EEG and audio dataset for auditory attention decoding","author":"Fuglsang","year":"2018"},{"issue":"11","key":"10.1016\/j.patrec.2026.03.005_bib0036","first-page":"1919","article-title":"Based on audio-video evoked auditory attention detection electroencephalogram dataset","volume":"64","author":"Zhang","year":"2024","journal-title":"J. Tsinghua Univ. (Sci. Technol.)"},{"issue":"1","key":"10.1016\/j.patrec.2026.03.005_bib0037","doi-asserted-by":"crossref","DOI":"10.1088\/1741-2552\/ad2214","article-title":"What are we really decoding? Unveiling biases in EEG-based decoding of the spatial focus of auditory attention","volume":"21","author":"Rotaru","year":"2024","journal-title":"J. Neural Eng."}],"container-title":["Pattern Recognition Letters"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167865526000929?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0167865526000929?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,4,13]],"date-time":"2026-04-13T20:25:48Z","timestamp":1776111948000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0167865526000929"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,5]]},"references-count":37,"alternative-id":["S0167865526000929"],"URL":"https:\/\/doi.org\/10.1016\/j.patrec.2026.03.005","relation":{},"ISSN":["0167-8655"],"issn-type":[{"value":"0167-8655","type":"print"}],"subject":[],"published":{"date-parts":[[2026,5]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"The effect of speech representations on EEG-based auditory attention detection","name":"articletitle","label":"Article Title"},{"value":"Pattern Recognition Letters","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.patrec.2026.03.005","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier B.V. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}]}}