{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,22]],"date-time":"2026-04-22T19:28:10Z","timestamp":1776886090236,"version":"3.51.2"},"reference-count":34,"publisher":"Tsinghua University Press","issue":"4","funder":[{"DOI":"10.13039\/501100012166","name":"National Key R&D Program of China","doi-asserted-by":"publisher","award":["2022ZD0160705,2022ZD0160704"],"award-info":[{"award-number":["2022ZD0160705,2022ZD0160704"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["Big Data Min. Anal."],"published-print":{"date-parts":[[2024,12]]},"DOI":"10.26599\/bdma.2024.9020044","type":"journal-article","created":{"date-parts":[[2024,12,4]],"date-time":"2024-12-04T19:23:58Z","timestamp":1733340238000},"page":"1116-1128","source":"Crossref","is-referenced-by-count":22,"title":["MedBench: A Comprehensive, Standardized, and Reliable Benchmarking System for Evaluating Chinese Medical Large Language Models"],"prefix":"10.26599","volume":"7","author":[{"given":"Mianxin","family":"Liu","sequence":"first","affiliation":[{"name":"Shanghai Artificial Intelligence Laboratory,Shanghai,China,200232"}]},{"given":"Weiguo","family":"Hu","sequence":"additional","affiliation":[{"name":"Ruijin Hospital Affiliated to Shanghai Jiao Tong University, School of Medicine,Shanghai,China,200025"}]},{"given":"Jinru","family":"Ding","sequence":"additional","affiliation":[{"name":"Shanghai Artificial Intelligence Laboratory,Shanghai,China,200232"}]},{"given":"Jie","family":"Xu","sequence":"additional","affiliation":[{"name":"Shanghai Artificial Intelligence Laboratory,Shanghai,China,200232"}]},{"given":"Xiaoyang","family":"Li","sequence":"additional","affiliation":[{"name":"Shanghai Artificial Intelligence Laboratory,Shanghai,China,200232"}]},{"given":"Lifeng","family":"Zhu","sequence":"additional","affiliation":[{"name":"Ruijin Hospital Affiliated to Shanghai Jiao Tong University, School of Medicine,Shanghai,China,200025"}]},{"given":"Zhian","family":"Bai","sequence":"additional","affiliation":[{"name":"Ruijin Hospital Affiliated to Shanghai Jiao Tong University, School of Medicine,Shanghai,China,200025"}]},{"given":"Xiaoming","family":"Shi","sequence":"additional","affiliation":[{"name":"Shanghai Artificial Intelligence Laboratory,Shanghai,China,200232"}]},{"given":"Benyou","family":"Wang","sequence":"additional","affiliation":[{"name":"The Chinese University of Hong Kong,Shenzhen,China,518172"}]},{"given":"Haitao","family":"Song","sequence":"additional","affiliation":[{"name":"Shanghai Artificial Intelligence Research Institute,Shanghai,200240"}]},{"given":"Pengfei","family":"Liu","sequence":"additional","affiliation":[{"name":"School of Electronic Information and Electrical Engineering, Shanghai Jiao Tong University,Shanghai,China,200240"}]},{"given":"Xiaofan","family":"Zhang","sequence":"additional","affiliation":[{"name":"Qing Yuan Research Institute, Shanghai Jiao Tong University,Shanghai,China,200240"}]},{"given":"Shanshan","family":"Wang","sequence":"additional","affiliation":[{"name":"Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences,Shenzhen,China,518055"}]},{"given":"Kang","family":"Li","sequence":"additional","affiliation":[{"name":"West China Hospital, Sichuan University,Chengdu,China,610041"}]},{"given":"Haofen","family":"Wang","sequence":"additional","affiliation":[{"name":"School of Design and Innovation, Tongji University,Shanghai,China,200092"}]},{"given":"Tong","family":"Ruan","sequence":"additional","affiliation":[{"name":"East China University of Science and Technology,Department of Computer Science and Technology,Shanghai,China,200237"}]},{"given":"Xuanjing","family":"Huang","sequence":"additional","affiliation":[{"name":"School of Computer Science, Fudan University,Shanghai,China,200433"}]},{"given":"Xin","family":"Sun","sequence":"additional","affiliation":[{"name":"Xinhua Hospital Affiliated to Shanghai Jiaotong University School of Medicine,Shanghai,China,200092"}]},{"given":"Shaoting","family":"Zhang","sequence":"additional","affiliation":[{"name":"Shanghai Artificial Intelligence Laboratory,Shanghai,China,200232"}]}],"member":"11138","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1038\/s41591-023-02448-8"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1038\/s41591-023-02700-1"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-023-06455-0"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.698"},{"key":"ref5","author":"Liu","year":"2023","journal-title":"Benchmarking large language models on CMExam: A comprehensive Chinese medical exam dataset"},{"key":"ref6","article-title":"CMB: A comprehensive medical benchmark in Chinese","author":"Wang","year":"2023","journal-title":"arXiv preprint"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.acl-long.544"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1056\/aidbp2300092"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.ebiom.2023.104770"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.naacl-long.263"},{"key":"ref11","author":"Zhou","year":"2023","journal-title":"Don\u2019t make your LLM an evaluation benchmark cheater"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1097\/JS9.0000000000000373"},{"key":"ref13","article-title":"OpenMEDLab: An open-source platform for multi-modality foundation models in medicine","author":"Wang","year":"2024","journal-title":"arXiv preprint"},{"key":"ref14","author":"Zeng","year":"2022","journal-title":"GLM-130B: An open bilingual pre-trained model"},{"key":"ref15","article-title":"Hua Tuo: Tuning LLaMA model with Chinese medical knowledge","author":"Wang","year":"2023","journal-title":"arXiv preprint"},{"key":"ref16","article-title":"BianQue: Balancing the questioning and suggestion ability of health LLMs with multi-turn health conversations polished by ChatGPT","author":"Chen","year":"2023","journal-title":"arXiv preprint"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.3115\/1073083.1073135"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.3115\/1218955.1219032"},{"issue":"3","key":"ref19","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1145\/3641289","volume":"15","author":"Chang","year":"2024","journal-title":"ACM Trans. Intell. Syst. Technol."},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1016\/j.cogsys.2019.09.025"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3632971.3632980"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3539597.3573023"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1093\/bib\/bbae145"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-023-42528-4"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1016\/j.ebiom.2019.01.023"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-43996-4_10"},{"key":"ref27","author":"Cheng","journal-title":"SAM-Med2D"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2023.102996"},{"key":"ref29","article-title":"Data-centric foundation models in computational healthcare: A survey","author":"Zhang","year":"2024","journal-title":"arXiv preprint"},{"key":"ref30","article-title":"LLaVA-med: Training a large language-and-vision assistant for biomedicine in one day","author":"Li","year":"2023","journal-title":"arXiv preprint"},{"key":"ref31","article-title":"Capabilities of gemini models in medicine","author":"Saab","year":"2024","journal-title":"arXiv preprint"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1038\/s41597-023-02460-0"},{"key":"ref33","author":"Hu","year":"2024","journal-title":"Omni MedVQA: A new large-scale comprehensive evaluation benchmark for medical LVLM"},{"key":"ref34","year":"2023","journal-title":"A universal evaluation platform for foundation models"}],"container-title":["Big Data Mining and Analytics"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/8254253\/10778131\/10778138.pdf?arnumber=10778138","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,5]],"date-time":"2024-12-05T06:07:09Z","timestamp":1733378829000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10778138\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,12]]},"references-count":34,"journal-issue":{"issue":"4"},"URL":"https:\/\/doi.org\/10.26599\/bdma.2024.9020044","relation":{},"ISSN":["2096-0654","2097-406X"],"issn-type":[{"value":"2096-0654","type":"print"},{"value":"2097-406X","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,12]]}}}