{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,16]],"date-time":"2026-06-16T06:55:58Z","timestamp":1781592958475,"version":"3.54.5"},"reference-count":30,"publisher":"Elsevier BV","license":[{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/tdm\/userlicense\/1.0\/"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.elsevier.com\/legal\/tdmrep-license"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-017"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-012"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,9,1]],"date-time":"2026-09-01T00:00:00Z","timestamp":1788220800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-004"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["elsevier.com","sciencedirect.com"],"crossmark-restriction":true},"short-container-title":["Engineering Applications of Artificial Intelligence"],"published-print":{"date-parts":[[2026,9]]},"DOI":"10.1016\/j.engappai.2026.115180","type":"journal-article","created":{"date-parts":[[2026,5,28]],"date-time":"2026-05-28T09:05:41Z","timestamp":1779959141000},"page":"115180","update-policy":"https:\/\/doi.org\/10.1016\/elsevier_cm_policy","source":"Crossref","is-referenced-by-count":0,"special_numbering":"P1","title":["EnhanceIT: Enhancing instruction tuning of large language models with selective quality and diversity instruction data"],"prefix":"10.1016","volume":"179","author":[{"ORCID":"https:\/\/orcid.org\/0009-0000-7750-1629","authenticated-orcid":false,"given":"Qiang","family":"Huang","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Feng","family":"Huang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Dehao","family":"Tao","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Dejing","family":"Dou","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Yongfeng","family":"Huang","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"78","reference":[{"key":"10.1016\/j.engappai.2026.115180_b1","series-title":"GPT-4 technical report","author":"Achiam","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b2","series-title":"Qwen technical report","author":"Bai","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b3","series-title":"Instruction mining: When data mining meets large language model finetuning","author":"Cao","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b4","series-title":"A survey on evaluation of large language models","author":"Chang","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b5","series-title":"AlpaGasus: Training a better alpaca with fewer data","author":"Chen","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b6","series-title":"AlpaGasus: Training a better alpaca with fewer data","author":"Chen","year":"2024"},{"key":"10.1016\/j.engappai.2026.115180_b7","series-title":"Vicuna: An open-source chatbot impressing GPT-4 with 90%* ChatGPT quality","author":"Chiang","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b8","doi-asserted-by":"crossref","first-page":"454","DOI":"10.1162\/tacl_a_00317","article-title":"TyDi QA: A Benchmark for Information-Seeking Question Answering in Typologically Diverse Languages","volume":"8","author":"Clark","year":"2020","journal-title":"Trans. Assoc. Comput. Linguist."},{"key":"10.1016\/j.engappai.2026.115180_b9","series-title":"Training verifiers to solve math word problems","author":"Cobbe","year":"2021"},{"key":"10.1016\/j.engappai.2026.115180_b10","series-title":"Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing","first-page":"3029","article-title":"Enhancing chat language models by scaling high-quality instructional conversations","author":"Ding","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b11","series-title":"Advances in Neural Information Processing Systems","first-page":"30039","article-title":"AlpacaFarm: A simulation framework for methods that learn from human feedback","volume":"36","author":"Dubois","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b12","article-title":"A survey on llm-as-a-judge","author":"Gu","year":"2024","journal-title":"Innov."},{"key":"10.1016\/j.engappai.2026.115180_b13","series-title":"Proceedings of the Annual Meeting of the Cognitive Science Society","article-title":"Unifit: A unified framework for instruction tuning to improve instruction following ability for large language models","author":"Huang","year":"2024"},{"key":"10.1016\/j.engappai.2026.115180_b14","series-title":"Mistral 7B","author":"Jiang","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b15","series-title":"From quantity to quality: Boosting LLM performance with self-guided data selection for instruction tuning","author":"Li","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b16","series-title":"SelectIT: Selective instruction tuning for large language models via uncertainty-aware self-reflection","author":"Liu","year":"2024"},{"key":"10.1016\/j.engappai.2026.115180_b17","series-title":"NeurIPS","article-title":"Training language models to follow instructions with human feedback","author":"Ouyang","year":"2022"},{"key":"10.1016\/j.engappai.2026.115180_b18","series-title":"Instruction tuning with GPT-4","author":"Peng","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b19","series-title":"ToolLLM: Facilitating large language models to master 16000+ real-world APIs","author":"Qin","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b20","series-title":"Annual Meeting of the Association for Computational Linguistics","article-title":"Challenging BIG-bench tasks and whether chain-of-thought can solve them","author":"Suzgun","year":"2022"},{"key":"10.1016\/j.engappai.2026.115180_b21","series-title":"Llama 2: Open foundation and fine-tuned chat models","author":"Touvron","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b22","series-title":"Annual Meeting of the Association for Computational Linguistics","article-title":"Self-instruct: Aligning language models with self-generated instructions","author":"Wang","year":"2022"},{"key":"10.1016\/j.engappai.2026.115180_b23","series-title":"The Tenth International Conference on Learning Representations, ICLR 2022, Virtual Event, April 25-29, 2022","article-title":"Finetuned language models are zero-shot learners","author":"Wei","year":"2022"},{"key":"10.1016\/j.engappai.2026.115180_b24","series-title":"Advances in Neural Information Processing Systems","first-page":"24824","article-title":"Chain-of-thought prompting elicits reasoning in large language models","volume":"35","author":"Wei","year":"2022"},{"key":"10.1016\/j.engappai.2026.115180_b25","series-title":"AAPO: enhancing the reasoning capabilities of LLMs with advantage momentum","author":"Xiong","year":"2025"},{"key":"10.1016\/j.engappai.2026.115180_b26","series-title":"WizardLM: Empowering large language models to follow complex instructions","author":"Xu","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b27","series-title":"Baichuan 2: Open large-scale language models","author":"Yang","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b28","series-title":"Resolving knowledge conflicts in domain-specific data selection: A case study on medical instruction-tuning","author":"Zhong","year":"2025"},{"key":"10.1016\/j.engappai.2026.115180_b29","series-title":"LIMA: Less is more for alignment","author":"Zhou","year":"2023"},{"key":"10.1016\/j.engappai.2026.115180_b30","series-title":"CCF International Conference on Natural Language Processing and Chinese Computing","first-page":"229","article-title":"Bread: A hybrid approach for instruction data mining through balanced retrieval and dynamic data sampling","author":"Zhuang","year":"2024"}],"container-title":["Engineering Applications of Artificial Intelligence"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0952197626014648?httpAccept=text\/xml","content-type":"text\/xml","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/api.elsevier.com\/content\/article\/PII:S0952197626014648?httpAccept=text\/plain","content-type":"text\/plain","content-version":"vor","intended-application":"text-mining"}],"deposited":{"date-parts":[[2026,6,16]],"date-time":"2026-06-16T06:46:22Z","timestamp":1781592382000},"score":1,"resource":{"primary":{"URL":"https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0952197626014648"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,9]]},"references-count":30,"alternative-id":["S0952197626014648"],"URL":"https:\/\/doi.org\/10.1016\/j.engappai.2026.115180","relation":{},"ISSN":["0952-1976"],"issn-type":[{"value":"0952-1976","type":"print"}],"subject":[],"published":{"date-parts":[[2026,9]]},"assertion":[{"value":"Elsevier","name":"publisher","label":"This article is maintained by"},{"value":"EnhanceIT: Enhancing instruction tuning of large language models with selective quality and diversity instruction data","name":"articletitle","label":"Article Title"},{"value":"Engineering Applications of Artificial Intelligence","name":"journaltitle","label":"Journal Title"},{"value":"https:\/\/doi.org\/10.1016\/j.engappai.2026.115180","name":"articlelink","label":"CrossRef DOI link to publisher maintained version"},{"value":"article","name":"content_type","label":"Content Type"},{"value":"\u00a9 2026 Elsevier Ltd. All rights are reserved, including those for text and data mining, AI training, and similar technologies.","name":"copyright","label":"Copyright"}],"article-number":"115180"}}