{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,30]],"date-time":"2026-01-30T09:57:20Z","timestamp":1769767040574,"version":"3.49.0"},"reference-count":62,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"11","license":[{"start":{"date-parts":[[2025,11,1]],"date-time":"2025-11-01T00:00:00Z","timestamp":1761955200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2025,11,1]],"date-time":"2025-11-01T00:00:00Z","timestamp":1761955200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,11,1]],"date-time":"2025-11-01T00:00:00Z","timestamp":1761955200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62376135"],"award-info":[{"award-number":["62376135"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"National Research Foundation, Singapore and DSO National Laboratories"},{"name":"AI Singapore Programme","award":["AISG2-RP-2020-019"],"award-info":[{"award-number":["AISG2-RP-2020-019"]}]},{"name":"RIE 2020 Advanced Manufacturing and Engineering Singapore Programmatic Fund","award":["A20G8b0102"],"award-info":[{"award-number":["A20G8b0102"]}]},{"name":"Postdoctoral Fellowship Program of CPSF","award":["GZC20251641"],"award-info":[{"award-number":["GZC20251641"]}]},{"name":"Postdoctoral Innovation Program of Shandong Province","award":["SDCX-ZG-202502021"],"award-info":[{"award-number":["SDCX-ZG-202502021"]}]},{"DOI":"10.13039\/501100001459","name":"Ministry of Education - Singapore","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001459","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Academic Research Fund Tier 1","award":["RG101\/24"],"award-info":[{"award-number":["RG101\/24"]}]},{"name":"Shandong Key Laboratory of Artificial Intelligence Application for Livelihood Services","award":["PKL2024A45"],"award-info":[{"award-number":["PKL2024A45"]}]},{"name":"Shandong Higher Education Institution Laboratory of General Artificial Intelligence for Future Industries"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Pattern Anal. Mach. Intell."],"published-print":{"date-parts":[[2025,11]]},"DOI":"10.1109\/tpami.2025.3593657","type":"journal-article","created":{"date-parts":[[2025,7,29]],"date-time":"2025-07-29T18:30:15Z","timestamp":1753813815000},"page":"10770-10786","source":"Crossref","is-referenced-by-count":0,"title":["HPformer: Low-Parameter Transformer With Temporal Dependency Hierarchical Propagation for Health Informatics"],"prefix":"10.1109","volume":"47","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2838-8062","authenticated-orcid":false,"given":"Wu","family":"Lee","sequence":"first","affiliation":[{"name":"School of Software, Shandong University, Jinan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1824-4244","authenticated-orcid":false,"given":"Yuliang","family":"Shi","sequence":"additional","affiliation":[{"name":"School of Software, Shandong University, Jinan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6893-8650","authenticated-orcid":false,"given":"Han","family":"Yu","sequence":"additional","affiliation":[{"name":"School of Computer Science and Engineering, Nanyang Technological University, Singapore"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5484-3351","authenticated-orcid":false,"given":"Lin","family":"Cheng","sequence":"additional","affiliation":[{"name":"School of Software, Shandong University, Jinan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8504-1028","authenticated-orcid":false,"given":"Xinjun","family":"Wang","sequence":"additional","affiliation":[{"name":"School of Software, Shandong University, Jinan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5271-5417","authenticated-orcid":false,"given":"Zhongmin","family":"Yan","sequence":"additional","affiliation":[{"name":"School of Software, Shandong University, Jinan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1369-6855","authenticated-orcid":false,"given":"Fanyu","family":"Kong","sequence":"additional","affiliation":[{"name":"School of Software, Shandong University, Jinan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1162\/089976600300015015"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1207\/s15516709cog1402_1"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/D14-1179"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1810.04805"},{"key":"ref7","article-title":"Improving language understanding by generative pre-training","author":"Radford","year":"2018"},{"issue":"8","key":"ref8","article-title":"Language models are unsupervised multitask learners","volume":"1","author":"Radford","year":"2019","journal-title":"OpenAI Blog"},{"key":"ref9","first-page":"1877","article-title":"Language models are few-shot learners","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Brown"},{"key":"ref10","first-page":"27 730","article-title":"Training language models to follow instructions with human feedback","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Ouyang"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/iccv48922.2021.00986"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"ref13","article-title":"An image is worth 16 x 16 words: Transformers for image recognition at scale","volume-title":"Proc. 9th Int. Conf. Learn. Representations","author":"Dosovitskiy"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.21437\/interspeech.2020-3015"},{"key":"ref15","first-page":"7004","article-title":"Transformer transducer: A streamable speech recognition model with transformer encoders and RNN-T loss","volume-title":"Proc. 2021 IEEE Int. Conf. Acoust. Speech Signal Process.","author":"Fan"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/icassp40776.2020.9053512"},{"key":"ref17","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Radford"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58577-8_8"},{"key":"ref19","first-page":"13","article-title":"VilBERT: Pretraining task-agnostic visiolinguistic representations for vision-and-language tasks","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Lu"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1514"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i07.6795"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1038\/s41597-019-0103-9"},{"key":"ref23","article-title":"Retain: An interpretable predictive model for healthcare using reverse time attention mechanism","author":"Choi","year":"2016"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3097983.3097997"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i01.5427"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1145\/3366423.3380136"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403107"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1145\/3340531.3411864"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/3530811"},{"key":"ref30","article-title":"Linformer: Self-attention with linear complexity","author":"Wang","year":"2020"},{"key":"ref31","article-title":"Rethinking attention with performers","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Choromanski"},{"key":"ref32","first-page":"24 226","article-title":"Flowformer: Linearizing transformers with conservation flows","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Wu"},{"key":"ref33","first-page":"17 413","article-title":"Scatterbrain: Unifying sparse and low-rank attention","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Chen"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.5040\/9781501365072.13350"},{"key":"ref35","first-page":"12 437","article-title":"Poolingformer: Long document modeling with pooling attention","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Zhang"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.findings-acl.346"},{"key":"ref37","article-title":"Generating long sequences with sparse transformers","author":"Child","year":"2019"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i12.17325"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.21236\/ADA594171"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1038\/sdata.2016.35"},{"key":"ref41","article-title":"MIMIC-IV (version 1.0)","author":"Johnson","year":"2020"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/TVCG.2018.2865027"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11635"},{"key":"ref44","first-page":"17 413","article-title":"Scatterbrain: Unifying sparse and low-rank attention","volume-title":"Proc. 34th Annu. Conf. Neural Inf. Process. Syst.","author":"Chen"},{"key":"ref45","first-page":"16344","article-title":"FlashAttention: Fast and memory-efficient exact attention with IO-awareness","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Dao"},{"key":"ref46","article-title":"Layer normalization","author":"Ba","year":"2016"},{"key":"ref47","article-title":"Long range arena : A benchmark for efficient transformers","volume-title":"Proc. 9th Int. Conf. Learn. Representations","author":"Tay"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611975321.30"},{"key":"ref49","first-page":"4091","article-title":"Attend and diagnose: Clinical time series analysis using attention models","volume-title":"Proc. 32nd AAAI Conf. Artif. Intell.-30th Innov. Appl. Artif. Intell.-8th AAAI Symp. Educ. Adv. Artif. Intell.","author":"Song"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1016\/j.patrec.2005.10.010"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0092209"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1177\/001316446002000104"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1177\/001316448104100307"},{"key":"ref54","article-title":"Empirical evaluation of gated recurrent neural networks on sequence modeling","author":"Chung","year":"2014"},{"key":"ref55","article-title":"Adam: A method for stochastic optimization","author":"Kingma","year":"2014"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/5.58337"},{"key":"ref57","first-page":"5156","article-title":"Transformers are RNNs: Fast autoregressive transformers with linear attention","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Katharopoulos"},{"key":"ref58","first-page":"9438","article-title":"Sparse Sinkhorn Attention","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Tay"},{"key":"ref59","first-page":"10183","article-title":"Synthesizer: Rethinking self-attention in transformer models","volume-title":"Proc. Int. Conf. Mach. Learn.","author":"Tay"},{"key":"ref60","article-title":"Longformer: The long-document transformer","author":"Beltagy","year":"2020"},{"key":"ref61","first-page":"17283","article-title":"Big Bird: Transformers for longer sequences","volume-title":"Proc. Int. Conf. Neural Inf. Process. Syst.","author":"Zaheer"},{"key":"ref62","article-title":"cosFormer: Rethinking softmax in attention","volume-title":"Proc. Int. Conf. Learn. Representations","author":"Zhen"}],"container-title":["IEEE Transactions on Pattern Analysis and Machine Intelligence"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/34\/11192800\/11098976.pdf?arnumber=11098976","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,8]],"date-time":"2025-10-08T17:37:44Z","timestamp":1759945064000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11098976\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11]]},"references-count":62,"journal-issue":{"issue":"11"},"URL":"https:\/\/doi.org\/10.1109\/tpami.2025.3593657","relation":{},"ISSN":["0162-8828","2160-9292","1939-3539"],"issn-type":[{"value":"0162-8828","type":"print"},{"value":"2160-9292","type":"electronic"},{"value":"1939-3539","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,11]]}}}