{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,3]],"date-time":"2026-06-03T01:08:38Z","timestamp":1780448918450,"version":"3.54.1"},"reference-count":31,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,4,6]],"date-time":"2025-04-06T00:00:00Z","timestamp":1743897600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,4,6]],"date-time":"2025-04-06T00:00:00Z","timestamp":1743897600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,4,6]]},"DOI":"10.1109\/icassp49660.2025.10889045","type":"proceedings-article","created":{"date-parts":[[2025,3,12]],"date-time":"2025-03-12T17:15:19Z","timestamp":1741799719000},"page":"1-5","source":"Crossref","is-referenced-by-count":2,"title":["Extract Information from Hybrid Long Documents Leveraging LLMs: A Framework and Dataset"],"prefix":"10.1109","author":[{"given":"Chongjian","family":"Yue","sequence":"first","affiliation":[{"name":"Peking University,School of Software &#x0026; Microelectronics,Beijing,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xinrun","family":"Xu","sequence":"additional","affiliation":[{"name":"Institute of Software,Chinese Academy of Sciences,Beijing,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Xiaojun","family":"Ma","sequence":"additional","affiliation":[{"name":"Microsoft,Beijing,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Lun","family":"Du","sequence":"additional","affiliation":[{"name":"Ant Group,Beijing,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Zhiming","family":"Ding","sequence":"additional","affiliation":[{"name":"Institute of Software,Chinese Academy of Sciences,Beijing,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Shi","family":"Han","sequence":"additional","affiliation":[{"name":"Microsoft,Beijing,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Dongmei","family":"Zhang","sequence":"additional","affiliation":[{"name":"Microsoft,Beijing,China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Qi","family":"Zhang","sequence":"additional","affiliation":[{"name":"Microsoft,Beijing,China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","article-title":"Chain-of-thought prompting elicits reasoning in large language models","author":"Wei","year":"2023"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i16.29779"},{"key":"ref3","article-title":"A survey on game playing agents and large models: Methods, applications, and challenges","author":"Xu","year":"2024"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-emnlp.588"},{"key":"ref5","article-title":"Enabling and analyzing how to efficiently extract information from hybrid long documents with llms","author":"Yue","year":"2023"},{"key":"ref6","first-page":"22199","article-title":"Large language models are zero-shot reasoners","volume":"35","author":"Kojima","year":"2022","journal-title":"Advances in neural information processing systems"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.findings-eacl.83"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/3539618.3591708"},{"key":"ref9","article-title":"Cradle: Empowering foundation agents towards general computer control","volume-title":"NeurIPS 2024 Workshop on Open-World Agents","author":"Tan"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3447548.3467101"},{"key":"ref11","article-title":"Can large language models recall reference location like humans?","author":"Wang","year":"2024"},{"key":"ref12","article-title":"Mllm as retriever: Interactively learning multimodal retrieval for embodied agents","author":"Yue","year":"2024"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D19-1410"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.conll-1.52"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1039\/d4dd00016a"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/3342558.3345420"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3397271.3401406"},{"key":"ref18","article-title":"Exploring word representations on time expression recognition","author":"Chen","year":"2019","journal-title":"Microsoft Research Technical Report MSR-TR-2019-46"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR56361.2022.9956191"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.300"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.acl-long.254"},{"key":"ref22","first-page":"6588","article-title":"MultiHiertt: Numerical reasoning over multi hierarchical tabular and textual data","volume-title":"Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers)","author":"Zhao"},{"key":"ref23","article-title":"Unleashing infinite-length input capacity for large-scale language models with self-controlled memory system","author":"Liang","year":"2023"},{"key":"ref24","article-title":"Evaluating chatgpt\u2019s information extraction capabilities: An assessment of performance, explainability, calibration, and faithfulness","author":"Li","year":"2023"},{"key":"ref25","article-title":"Zero-shot information extraction via chatting with chatgpt","author":"Wei","year":"2023"},{"key":"ref26","article-title":"Context-ner: Contextual phrase generation at scale","author":"Gupta","year":"2021"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.findings-naacl.239"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.214"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.sustainlp-1.13"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICDMW60847.2023.00073"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.14778\/3626292.3626294"}],"event":{"name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","location":"Hyderabad, India","start":{"date-parts":[[2025,4,6]]},"end":{"date-parts":[[2025,4,11]]}},"container-title":["ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/10887540\/10887541\/10889045.pdf?arnumber=10889045","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,25]],"date-time":"2026-03-25T05:22:09Z","timestamp":1774416129000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10889045\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,6]]},"references-count":31,"URL":"https:\/\/doi.org\/10.1109\/icassp49660.2025.10889045","relation":{},"subject":[],"published":{"date-parts":[[2025,4,6]]}}}