{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,15]],"date-time":"2026-05-15T04:12:05Z","timestamp":1778818325565,"version":"3.51.4"},"reference-count":52,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100013290","name":"National Key Research and Development Program of China Stem Cell and Translational Research","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100013290","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Advanced Engineering Informatics"],"published-print":{"date-parts":[[2026,9]]},"DOI":"10.1016\/j.aei.2026.104726","type":"journal-article","created":{"date-parts":[[2026,4,26]],"date-time":"2026-04-26T17:42:45Z","timestamp":1777225365000},"page":"104726","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"PB","title":["XFD-LVLM: An explainable multimodal framework for aviation hydraulic pump intelligent fault diagnosis with large Vision-Language models"],"prefix":"10.1016","volume":"74","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9772-6515","authenticated-orcid":false,"given":"Quanning","family":"Xu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zihao","family":"Lei","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Guangrui","family":"Wen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shulong","family":"Gu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yu","family":"Su","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhibin","family":"Zhao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xuefeng","family":"Chen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"78","reference":[{"key":"10.1016\/j.aei.2026.104726_b0005","doi-asserted-by":"crossref","DOI":"10.1016\/j.ymssp.2024.111115","article-title":"High imbalance fault diagnosis of aviation hydraulic pump based on data augmentation via local wavelet similarity fusion[J]","volume":"209","author":"Fu","year":"2024","journal-title":"Mech. Syst. Sig. Process."},{"key":"10.1016\/j.aei.2026.104726_b0010","doi-asserted-by":"crossref","DOI":"10.1016\/j.aei.2024.102459","article-title":"Fault diagnosis study of hydraulic pump based on improved symplectic geometry reconstruction data enhancement method[J]","volume":"61","author":"Liu","year":"2024","journal-title":"Adv. Eng. Inf."},{"issue":"6","key":"10.1016\/j.aei.2026.104726_b0015","doi-asserted-by":"crossref","first-page":"3757","DOI":"10.1109\/TIE.2015.2417501","article-title":"A survey of fault diagnosis and fault-tolerant techniques\u2014Part I: fault diagnosis with model-based and signal-based approaches[J]","volume":"62","author":"Gao","year":"2015","journal-title":"IEEE Trans. Ind. Electron."},{"issue":"8","key":"10.1016\/j.aei.2026.104726_b0020","doi-asserted-by":"crossref","first-page":"3979","DOI":"10.1016\/j.jfranklin.2022.02.025","article-title":"Active fault diagnosis for a class of closed-loop systems via parameter estimation[J]","volume":"359","author":"Jia","year":"2022","journal-title":"J. Franklin Inst."},{"key":"10.1016\/j.aei.2026.104726_b0025","article-title":"Spatial-temporal graph feature learning driven by time-frequency similarity assessment for robust fault diagnosis of rotating machinery[J]","volume":"62","author":"Wang","year":"2024","journal-title":"Adv. Eng. Inf."},{"key":"10.1016\/j.aei.2026.104726_b0030","doi-asserted-by":"crossref","DOI":"10.1016\/j.aei.2024.103041","article-title":"A novel fault diagnosis method based on nonlinear-CWT and improved YOLOv8 for axial piston pump using output pressure signal[J]","volume":"64","author":"Xia","year":"2025","journal-title":"Adv. Eng. Inf."},{"key":"10.1016\/j.aei.2026.104726_b0035","doi-asserted-by":"crossref","DOI":"10.1016\/j.ymssp.2020.107161","article-title":"Coherence analysis to detect unsteady rotating stall phenomenon based on pressure pulsation signals of a centrifugal pump[J]","volume":"148","author":"Zhang","year":"2021","journal-title":"Mech. Syst. Sig. Process."},{"key":"10.1016\/j.aei.2026.104726_b0040","doi-asserted-by":"crossref","first-page":"95","DOI":"10.1016\/j.inffus.2022.09.013","article-title":"A synchronous holo-balancing method for flexible rotors based on the modified initial phase vector[J]","volume":"90","author":"Lei","year":"2023","journal-title":"Inf. Fusion"},{"key":"10.1016\/j.aei.2026.104726_b0045","doi-asserted-by":"crossref","DOI":"10.1016\/j.ymssp.2025.112896","article-title":"SFUGDA: Source-free unsupervised multiscale graph domain adaptation network with privacy-preserving for cross-domain fault diagnosis of offshore wind turbines[J]","volume":"235","author":"Lei","year":"2025","journal-title":"Mech. Syst. Sig. Process."},{"key":"10.1016\/j.aei.2026.104726_b0050","doi-asserted-by":"crossref","DOI":"10.1016\/j.inffus.2025.103277","article-title":"HSE: a plug-and-play module for unified fault diagnosis foundation models[J]","volume":"123","author":"Li","year":"2025","journal-title":"Inf. Fusion"},{"key":"10.1016\/j.aei.2026.104726_b0055","first-page":"1","article-title":"A novel unsupervised graph wavelet autoencoder for mechanical system fault detection[J]","author":"Li","year":"2024","journal-title":"J. Intell. Manuf."},{"key":"10.1016\/j.aei.2026.104726_b0060","article-title":"Explainable artificial intelligence based intelligent fault diagnosis: a systematic review from applications to insights[J]","volume":"111935","author":"Li","year":"2025","journal-title":"Reliab. Eng. Syst. Saf."},{"key":"10.1016\/j.aei.2026.104726_b0065","doi-asserted-by":"crossref","DOI":"10.1016\/j.lindif.2023.102274","article-title":"ChatGPT for good? on opportunities and challenges of large language models for education[J]","volume":"103","author":"Kasneci","year":"2023","journal-title":"Learn. Individ. Differ."},{"issue":"8","key":"10.1016\/j.aei.2026.104726_b0070","doi-asserted-by":"crossref","first-page":"1930","DOI":"10.1038\/s41591-023-02448-8","article-title":"Large language models in medicine[J]","volume":"29","author":"Thirunavukarasu","year":"2023","journal-title":"Nat. Med."},{"key":"10.1016\/j.aei.2026.104726_b0075","doi-asserted-by":"crossref","DOI":"10.1016\/j.ymssp.2024.112127","article-title":"LLM-based framework for bearing fault diagnosis[J]","volume":"224","author":"Tao","year":"2025","journal-title":"Mech. Syst. Sig. Process."},{"key":"10.1016\/j.aei.2026.104726_b0080","doi-asserted-by":"crossref","first-page":"557","DOI":"10.1016\/j.jmsy.2026.02.016","article-title":"A Multi-Agent and synergistic Knowledge Graph retrieval-augmented generation framework for intelligent maintenance[J]","volume":"85","author":"Lin","year":"2026","journal-title":"J. Manuf. Syst."},{"key":"10.1016\/j.aei.2026.104726_b0085","unstructured":"Shu H, Wang Y, Song W, et al. Forecasting the Future with Future Technologies: Advancements in Large Meteorological Models[J]. arXiv preprint arXiv:2404.06668, 2024."},{"key":"10.1016\/j.aei.2026.104726_b0090","doi-asserted-by":"crossref","DOI":"10.1016\/j.aei.2025.103524","article-title":"Integrating large models with topology optimization for conceptual design realization[J]","volume":"67","author":"Liang","year":"2025","journal-title":"Adv. Eng. Inf."},{"key":"10.1016\/j.aei.2026.104726_b0095","doi-asserted-by":"crossref","DOI":"10.1016\/j.aei.2025.103997","article-title":"Deep digital twin-powered large vision-language model for multi-scenario industrial fault diagnosis[J]","volume":"69","author":"Xu","year":"2026","journal-title":"Adv. Eng. Inf."},{"key":"10.1016\/j.aei.2026.104726_b0100","doi-asserted-by":"crossref","DOI":"10.1016\/j.ress.2024.110312","article-title":"ParInfoGPT: an LLM-based two-stage framework for reliability assessment of rotating machine under partial information[J]","volume":"250","author":"Pang","year":"2024","journal-title":"Reliab. Eng. Syst. Saf."},{"key":"10.1016\/j.aei.2026.104726_b0105","doi-asserted-by":"crossref","DOI":"10.1016\/j.aei.2025.103208","article-title":"FD-LLM: Large language model for fault diagnosis of complex equipment[J]","volume":"65","author":"Lin","year":"2025","journal-title":"Adv. Eng. Inf."},{"key":"10.1016\/j.aei.2026.104726_b0110","article-title":"WamGLM: a multimodal large-scale language model for wafer map defect information in-depth query through multi-turn dialogue based on prototypical supervised contrastive learning[J]","volume":"113962","author":"Gu","year":"2025","journal-title":"Appl. Soft Comput."},{"key":"10.1016\/j.aei.2026.104726_b0115","unstructured":"Chen J, Huang R, Lv Z, et al. Faultgpt: Industrial fault diagnosis question answering system by vision language models[J]. arXiv preprint arXiv:2502.15481, 2025."},{"key":"10.1016\/j.aei.2026.104726_b0120","doi-asserted-by":"crossref","unstructured":"Li Q, Zhang X, Huang J, et al. VSLLaVA: a pipeline of large multimodal foundation model for industrial vibration signal analysis[J]. arXiv preprint arXiv:2409.07482, 2024.","DOI":"10.2139\/ssrn.5006359"},{"key":"10.1016\/j.aei.2026.104726_b0260","doi-asserted-by":"crossref","DOI":"10.1016\/j.aei.2025.103156","article-title":"Transparent information fusion network: an explainable network for multi-source bearing fault diagnosis via self-organized neural-symbolic nodes[J]","volume":"65","author":"Li","year":"2025","journal-title":"Adv. Eng. Inf."},{"key":"10.1016\/j.aei.2026.104726_b0125","doi-asserted-by":"crossref","DOI":"10.1016\/j.ymssp.2023.110491","article-title":"Prior knowledge-embedded meta-transfer learning for few-shot fault diagnosis under variable operating conditions[J]","volume":"200","author":"Lei","year":"2023","journal-title":"Mech. Syst. Sig. Process."},{"key":"10.1016\/j.aei.2026.104726_b0130","doi-asserted-by":"crossref","DOI":"10.1016\/j.measurement.2021.110460","article-title":"Autoencoder-based representation learning and its application in intelligent fault diagnosis: a review[J]","volume":"189","author":"Yang","year":"2022","journal-title":"Measurement"},{"key":"10.1016\/j.aei.2026.104726_b0135","doi-asserted-by":"crossref","DOI":"10.1016\/j.engappai.2025.111954","article-title":"Sharpness-aware multidomain imbalance generalization with external adversarial learning and intrinsic balanced entropy regularization for intelligent fault diagnosis[J]","volume":"160","author":"Deng","year":"2025","journal-title":"Eng. Appl. Artif. Intel."},{"issue":"13","key":"10.1016\/j.aei.2026.104726_b0140","doi-asserted-by":"crossref","first-page":"23110","DOI":"10.1109\/JIOT.2024.3387741","article-title":"Knowledge distillation-guided cost-sensitive ensemble learning framework for imbalanced fault diagnosis[J]","volume":"11","author":"Deng","year":"2024","journal-title":"IEEE Internet Things J."},{"key":"10.1016\/j.aei.2026.104726_b0145","doi-asserted-by":"crossref","DOI":"10.1016\/j.engappai.2026.114336","article-title":"Lightweight cost-sensitive multi-expert dual knowledge transfer network for imbalanced fault diagnosis[J]","volume":"173","author":"Deng","year":"2026","journal-title":"Eng. Appl. Artif. Intel."},{"issue":"19","key":"10.1016\/j.aei.2026.104726_b0150","doi-asserted-by":"crossref","first-page":"31422","DOI":"10.1109\/JIOT.2024.3418352","article-title":"Online fault diagnosis of industrial robot using IoRT and hybrid deep learning techniques: an experimental approach[J]","volume":"11","author":"Bilal","year":"2024","journal-title":"IEEE Internet Things J."},{"key":"10.1016\/j.aei.2026.104726_b0155","doi-asserted-by":"crossref","DOI":"10.1016\/j.ymssp.2021.108653","article-title":"The emerging graph neural networks for intelligent fault diagnostics and prognostics: a guideline and a benchmark study[J]","volume":"168","author":"Li","year":"2022","journal-title":"Mech. Syst. Sig. Process."},{"key":"10.1016\/j.aei.2026.104726_b0160","doi-asserted-by":"crossref","first-page":"603","DOI":"10.1016\/j.jare.2025.02.029","article-title":"Digital twin-driven operational CycleGAN-based multiple virtual-physical mappings for remaining useful life prediction under limited life cycle data[J]","volume":"70","author":"Xu","year":"2025","journal-title":"J. Adv. Res."},{"key":"10.1016\/j.aei.2026.104726_b0165","article-title":"Virtual-physical mapping network-driven digital twin for intelligent fault diagnosis with imbalanced samples[J]","volume":"111783","author":"Xu","year":"2025","journal-title":"Comput. Ind. Eng."},{"key":"10.1016\/j.aei.2026.104726_b0170","doi-asserted-by":"crossref","first-page":"593","DOI":"10.1016\/j.jmsy.2026.02.008","article-title":"Leveraging large language models for smart manufacturing: Reviews, enablers, challenges, and opportunities[J]","volume":"85","author":"Chen","year":"2026","journal-title":"J. Manuf. Syst."},{"key":"10.1016\/j.aei.2026.104726_b0175","doi-asserted-by":"crossref","DOI":"10.1016\/j.eswa.2024.125861","article-title":"LLM-TSFD: an industrial time series human-in-the-loop fault diagnosis method based on a large language model[J]","volume":"264","author":"Zhang","year":"2025","journal-title":"Expert Syst. Appl."},{"key":"10.1016\/j.aei.2026.104726_b0180","article-title":"DT and LLM Driven Intelligent Maintenance System for L-DED and DAG-Based LLM Fault Diagnosis Evaluation Framework[J]","volume":"113942","author":"Tang","year":"2025","journal-title":"Appl. Soft Comput."},{"issue":"4","key":"10.1016\/j.aei.2026.104726_b0185","doi-asserted-by":"crossref","first-page":"2302","DOI":"10.1109\/TSMC.2020.3048950","article-title":"WaveletKernelNet: an interpretable deep neural network for industrial intelligent diagnosis[J]","volume":"52","author":"Li","year":"2021","journal-title":"IEEE Transactions on Systems, Man, and Cybernetics: Systems"},{"key":"10.1016\/j.aei.2026.104726_b0190","doi-asserted-by":"crossref","first-page":"20","DOI":"10.1016\/j.jmsy.2023.05.027","article-title":"Multilayer Grad-CAM: an effective tool towards explainable deep neural networks for intelligent fault diagnosis[J]","volume":"69","author":"Li","year":"2023","journal-title":"J. Manuf. Syst."},{"key":"10.1016\/j.aei.2026.104726_b0195","first-page":"8182","article-title":"Lvlm-intrepret: an interpretability tool for large vision-language models[C]\/\/Proceedings of the IEEE\/CVF","author":"Ben Melech Stan","year":"2024","journal-title":"Conference on Computer Vision and Pattern Recognition."},{"key":"10.1016\/j.aei.2026.104726_b0200","unstructured":"Ito M, Tanaka K, Matsuda K, et al. XDR-LVLM: An Explainable Vision-Language Large Model for Diabetic Retinopathy Diagnosis[J]. arXiv preprint arXiv:2508.15168, 2025."},{"key":"10.1016\/j.aei.2026.104726_b0205","doi-asserted-by":"crossref","DOI":"10.1016\/j.ress.2024.110382","article-title":"Empirical study on fine-tuning pre-trained large language models for fault diagnosis of complex systems[J]","volume":"252","author":"Zheng","year":"2024","journal-title":"Reliab. Eng. Syst. Saf."},{"issue":"2","key":"10.1016\/j.aei.2026.104726_b0210","first-page":"3","article-title":"Lora: Low-rank adaptation of large language models[J]","volume":"1","author":"Hu","year":"2022","journal-title":"ICLR"},{"key":"10.1016\/j.aei.2026.104726_b0215","first-page":"34892","article-title":"Visual instruction tuning[J]","volume":"36","author":"Liu","year":"2023","journal-title":"Adv. Neural Inf. Proces. Syst."},{"issue":"12","key":"10.1016\/j.aei.2026.104726_b0220","doi-asserted-by":"crossref","first-page":"14114","DOI":"10.1109\/TII.2024.3441638","article-title":"Large-scale visual language model boosted by contrast domain adaptation for intelligent industrial visual monitoring[J]","volume":"20","author":"Wang","year":"2024","journal-title":"IEEE Trans. Ind. Inf."},{"key":"10.1016\/j.aei.2026.104726_b0225","unstructured":"Touvron H, Lavril T, Izacard G, et al. Llama: Open and efficient foundation language models[J]. arXiv preprint arXiv:2302.13971, 2023."},{"key":"10.1016\/j.aei.2026.104726_b0230","first-page":"21406","author":"Aflalo","year":"2022","journal-title":"Vl-Interpret: an Interactive Visualization Tool for Interpreting Vision-Language Transformers[c]\/\/proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition."},{"key":"10.1016\/j.aei.2026.104726_b0235","doi-asserted-by":"crossref","DOI":"10.1016\/j.ress.2024.110684","article-title":"Unsupervised graph transfer network with hybrid attention mechanism for fault diagnosis under variable operating conditions[J]","volume":"255","author":"Lei","year":"2025","journal-title":"Reliab. Eng. Syst. Saf."},{"issue":"4","key":"10.1016\/j.aei.2026.104726_b0240","doi-asserted-by":"crossref","DOI":"10.1088\/1361-6501\/adbc0d","article-title":"A patch-interactive enhancement network for semiconductor wafer map mixed defect recognition with a two-stage training strategy[J]","volume":"36","author":"Gu","year":"2025","journal-title":"Meas. Sci. Technol."},{"key":"10.1016\/j.aei.2026.104726_b0245","first-page":"397","author":"Chefer","year":"2021","journal-title":"Generic Attention-Model Explainability for Interpreting Bi-Modal and Encoder-Decoder Transformers[c]\/\/proceedings of the IEEE\/CVF International Conference on Computer Vision."},{"key":"10.1016\/j.aei.2026.104726_b0250","doi-asserted-by":"crossref","DOI":"10.1016\/j.dib.2023.109987","article-title":"Motor current and vibration monitoring dataset for various faults in an E-motor-driven centrifugal pump[J]","volume":"52","author":"Bruinsma","year":"2024","journal-title":"Data Brief"},{"key":"10.1016\/j.aei.2026.104726_b0255","unstructured":"Chen B, Zheng Z, Yang L, et al. Seeing It or Not? Interpretable Vision-aware Latent Steering to Mitigate Object Hallucinations[J]. arXiv preprint arXiv:2505.17812, 2025."}],"container-title":["Advanced Engineering Informatics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1474034626004180?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S1474034626004180?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,5,15]],"date-time":"2026-05-15T03:35:46Z","timestamp":1778816146000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S1474034626004180"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,9]]},"references-count":52,"alternative-id":["S1474034626004180"],"URL":"https:\/\/doi.org\/10.1016\/j.aei.2026.104726","relation":{},"ISSN":["1474-0346"],"issn-type":[{"value":"1474-0346","type":"print"}],"subject":[],"published":{"date-parts":[[2026,9]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"XFD-LVLM: An explainable multimodal framework for aviation hydraulic pump intelligent fault diagnosis with large Vision-Language models","name":"articletitle","label":"Article Title"},{"value":"Advanced Engineering Informatics","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.aei.2026.104726","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier Ltd. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"104726"}}