{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T07:00:14Z","timestamp":1775199614865,"version":"3.50.1"},"reference-count":24,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T00:00:00Z","timestamp":1764979200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,12,6]],"date-time":"2025-12-06T00:00:00Z","timestamp":1764979200000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,12,6]]},"DOI":"10.1109\/asru65441.2025.11434610","type":"proceedings-article","created":{"date-parts":[[2026,4,2]],"date-time":"2026-04-02T19:48:04Z","timestamp":1775159284000},"page":"1-7","source":"Crossref","is-referenced-by-count":0,"title":["CLAIR\n                    <sub>A<\/sub>\n                    : Leveraging Large Language Models to Judge Audio Captions"],"prefix":"10.1109","author":[{"given":"Tsung-Han","family":"Wu","sequence":"first","affiliation":[{"name":"University of California Berkeley,Department of Electrical Engineering and Computer Science (EECS),Berkeley,CA,USA"}]},{"given":"Joseph E.","family":"Gonzalez","sequence":"additional","affiliation":[{"name":"University of California Berkeley,Department of Electrical Engineering and Computer Science (EECS),Berkeley,CA,USA"}]},{"given":"Trevor","family":"Darrell","sequence":"additional","affiliation":[{"name":"University of California Berkeley,Department of Electrical Engineering and Computer Science (EECS),Berkeley,CA,USA"}]},{"given":"David M.","family":"Chan","sequence":"additional","affiliation":[{"name":"University of California Berkeley,Department of Electrical Engineering and Computer Science 
(EECS),Berkeley,CA,USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/WASPAA.2017.8170058"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.3115\/1073083.1073135"},{"key":"ref3","first-page":"74","article-title":"ROUGE: A package for automatic evaluation of summaries","author":"Lin","year":"2004","journal-title":"Text Summarization Branches Out"},{"key":"ref4","first-page":"115","article-title":"Meteor, M-BLEU and M-TER: Evaluation metrics for high-correlation with human rankings of machine translation output","volume-title":"Proceedings of the Third Workshop on Statistical Machine Translation","author":"Agarwal"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7299087"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46454-1_24"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.100"},{"key":"ref8","article-title":"Bertscore: Evaluating text generation with BERT","volume-title":"8th International Conference on Learning Representations, ICLR 2020","author":"Zhang"},{"key":"ref9","first-page":"3982","article-title":"Sentence-BERT: Sentence embeddings using Siamese BERT-networks","volume-title":"Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP)","author":"Reimers"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP43922.2022.9746427"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10097021"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.23919\/EUSIPCO58844.2023.10289793"},{"key":"ref13","article-title":"Hello gpt-4o","year":"2024"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-acl.729"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.841"},{"key":"ref16","article-title":"Sparks of artificial general 
intelligence: Early experiments with gpt-4","author":"Bubeck","year":"2023","journal-title":"ArXiv preprint"},{"key":"ref17","article-title":"Qlora: Efficient finetuning of quantized llms","author":"Dettmers","year":"2023","journal-title":"ArXiv preprint"},{"key":"ref18","article-title":"Vicuna: An open-source chatbot impressing gpt-4 with 90%* chatgpt quality","author":"Chiang","year":"2023"},{"key":"ref19","article-title":"Language models are few-shot learners","volume-title":"Advances in Neural Information Processing Systems 33: Annual Conference on Neural Information Processing Systems 2020, NeurIPS 2020","author":"Brown"},{"key":"ref20","article-title":"Efficient guided generation for llms","author":"Willard","year":"2023","journal-title":"arXiv preprint arXiv:2307.09702"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP40776.2020.9052990"},{"key":"ref22","first-page":"119","article-title":"Audiocaps: Generating captions for audios in the wild","volume-title":"Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies","volume":"1","author":"Kim"},{"key":"ref23","article-title":"Gemini 1.5: Unlocking multimodal understanding across millions of tokens of context","author":"Team","year":"2024"},{"key":"ref24","article-title":"Phi-3 technical report: A highly capable language model locally on your phone","author":"Team","year":"2024"}],"event":{"name":"2025 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU)","location":"Honolulu, HI, USA","start":{"date-parts":[[2025,12,6]]},"end":{"date-parts":[[2025,12,10]]}},"container-title":["2025 IEEE Automatic Speech Recognition and Understanding Workshop 
(ASRU)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11434577\/11433836\/11434610.pdf?arnumber=11434610","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T04:57:00Z","timestamp":1775192220000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11434610\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,6]]},"references-count":24,"URL":"https:\/\/doi.org\/10.1109\/asru65441.2025.11434610","relation":{},"subject":[],"published":{"date-parts":[[2025,12,6]]}}}