{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T10:04:21Z","timestamp":1777889061568,"version":"3.51.4"},"reference-count":50,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,19]],"date-time":"2025-10-19T00:00:00Z","timestamp":1760832000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,19]]},"DOI":"10.1109\/iccv51701.2025.01572","type":"proceedings-article","created":{"date-parts":[[2026,4,29]],"date-time":"2026-04-29T19:45:49Z","timestamp":1777491949000},"page":"16927-16937","source":"Crossref","is-referenced-by-count":0,"title":["Scendi Score: Prompt-Aware Diversity Evaluation Via Schur Complement of Clip Embeddings"],"prefix":"10.1109","author":[{"given":"Azim","family":"Ospanov","sequence":"first","affiliation":[{"name":"&#x002A;The Chinese University of Hong Kong,Department of Computer Science &#x0026; Engineering"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mohammad","family":"Jalali","sequence":"additional","affiliation":[{"name":"&#x002A;The Chinese University of Hong Kong,Department of Computer Science &#x0026; Engineering"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Farzan","family":"Farnia","sequence":"additional","affiliation":[{"name":"&#x002A;The Chinese University of Hong Kong,Department of Computer Science &#x0026; Engineering"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","volume-title":"Consistency-diversity-realism pareto fronts of conditional image generative models","author":"Astolfi","year":"2024"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.52202\/079017-2678"},{"key":"ref3","article-title":"Demystifying mmd gans","author":"Bi\u0144kowski","year":"2018","journal-title":"arXiv preprint"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.52202\/075280-1102"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00084"},{"key":"ref6","volume-title":"Deepseek-v3 technical report","year":"2024"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref8","volume-title":"On the evaluation of conditional gans","author":"Terrance","year":"2019"},{"key":"ref9","article-title":"The vendi score: A diversity evaluation metric for machine learning","author":"Friedman","year":"2023","journal-title":"Transactions on machine learning research"},{"key":"ref10","article-title":"Interpreting CLIP\u2019s image representation via text-based decomposition","volume-title":"The Twelfth International Conference on Learning Representations","author":"Gandelsman"},{"key":"ref11","article-title":"Boosting the visual interpretability of clip via adversarial fine-tuning","volume-title":"The Thirteenth International Conference on Learning Representations","author":"Gong"},{"key":"ref12","article-title":"Kernel-based unsupervised embedding alignment for enhanced visual representation in vision-language models","author":"Gong","year":"2025","journal-title":"arXiv preprint"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-73021-4_13"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.595"},{"key":"ref15","article-title":"Gans trained by a two time-scale update rule converge to a local nash equilibrium","volume":"30","author":"Heusel","year":"2017","journal-title":"Advances in neural information processing systems"},{"key":"ref16","volume-title":"A multiarmed bandit approach to online selection and evaluation of generative models","author":"Hu","year":"2025"},{"key":"ref17","article-title":"An online learning approach to prompt-based selection of generative models and 11 ms","volume-title":"Forty-second International Conference on Machine Learning","author":"Hu"},{"key":"ref18","volume-title":"Promptwise: Online learning for cost-aware prompt assignment in generative models","author":"Hu","year":"2025"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.52202\/075280-0434"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/iccvw69036.2025.00791"},{"key":"ref21","article-title":"Sparke: Scalable prompt-aware diversity guidance in diffusion models via rke score","author":"Jalali","year":"2025","journal-title":"arXiv preprint"},{"key":"ref22","article-title":"Towards an explainable comparison and alignment of feature embeddings","author":"Jalali","year":"2025","journal-title":"arXiv preprint"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.215"},{"key":"ref24","volume-title":"Beyond aesthetics: Cultural competence in text-to-image models","author":"Kannen","year":"2024"},{"key":"ref25","article-title":"Attribute based interpretable evaluation metrics for generative models","volume-title":"Forty-first International Conference on Machine Learning","author":"Kim"},{"key":"ref26","article-title":"Improved precision and recall metric for assessing generative models","volume":"32","author":"Kynk\u00e4\u00e4nniemi","year":"2019","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref27","volume-title":"Flux: A diffusion-based text-to-image (t2i) model.","year":"2024"},{"key":"ref28","article-title":"Holistic evaluation of text-to-image models","volume-title":"Thirtyseventh Conference on Neural Information Processing Systems Datasets and Benchmarks Track","author":"Lee"},{"key":"ref29","article-title":"Language-biased image classification: evaluation based on semantic representations","volume-title":"International Conference on Learning Representations","author":"Lemesle"},{"key":"ref30","article-title":"The double-ellipsoid geometry of CLIP","volume-title":"Forty-second International Conference on Machine Learning","author":"Levi"},{"key":"ref31","article-title":"Holistic evaluation of language models","author":"Liang","journal-title":"Transactions on Machine Learning Research, 2023. Featured Certification, Expert Certification."},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01592"},{"key":"ref33","first-page":"7","volume-title":"Idenprof: A pre-trained deep learning model for identifying professionals in images, 2018.","author":"Moses","year":"2025"},{"key":"ref34","first-page":"7176","article-title":"Reliable fidelity and diversity metrics for generative models","volume-title":"International Conference on Machine Learning","author":"Naeem"},{"issue":"7","key":"ref35","volume-title":"Dalle 3","volume":"2","year":"2023"},{"key":"ref36","article-title":"Do vendi scores converge with finite samples? truncated vendi score for finitesample convergence guarantees","volume-title":"The 41st Conference on Uncertainty in Artificial Intelligence","author":"Ospanov"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.52202\/079017-3841"},{"key":"ref38","article-title":"Cousins of the vendi score: A family of similarity-based diversity metrics for science and machine learning","volume-title":"International Conference on Artificial Intelligence and Statistics.","author":"Pasarkar"},{"key":"ref39","article-title":"SDXL: Improving latent diffusion models for high-resolution image synthesis","volume-title":"The Twelfth International Conference on Learning Representations","author":"Podell"},{"key":"ref40","first-page":"8748","article-title":"Learning transferable visual models from natural language supervision","volume-title":"Proceedings of the 38th International Conference on Machine Learning","volume":"2","author":"Radford"},{"key":"ref41","first-page":"4","article-title":"Random features for largescale kernel machines","volume":"20","author":"Rahimi","year":"2007","journal-title":"Advances in neural information processing systems"},{"key":"ref42","volume-title":"Be more diverse than the most diverse: Optimal mixtures of generative models via mixture-ucb bandit algorithms","author":"Rezaei","year":"2025"},{"key":"ref43","article-title":"Assessing generative models via precision and recall","volume":"31","author":"Sajjadi","year":"2018","journal-title":"Advances in neural information processing systems"},{"key":"ref44","article-title":"Improved techniques for training GANs","author":"Salimans","year":"2016","journal-title":"Advances in Neural Information Processing Systems. Curran Associates, Inc."},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.74"},{"key":"ref46","article-title":"Axiomatic attribution for deep networks","author":"Sundararajan","year":"2017","journal-title":"CoRR, abs\/1703.01365"},{"key":"ref47","article-title":"On the distributed evaluation of generative models","author":"Wang","year":"2023","journal-title":"arXiv preprint"},{"key":"ref48","article-title":"An interpretable evaluation of entropy-based novelty of generative models","author":"Zhang","year":"2024","journal-title":"arXiv preprint"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52734.2025.00774"},{"key":"ref50","article-title":"Qwen3 embedding: Advancing text embedding and reranking through foundation models","author":"Zhang","year":"2025","journal-title":"arXiv preprint"}],"event":{"name":"2025 IEEE\/CVF International Conference on Computer Vision (ICCV)","location":"Honolulu, HI, USA","start":{"date-parts":[[2025,10,19]]},"end":{"date-parts":[[2025,10,25]]}},"container-title":["2025 IEEE\/CVF International Conference on Computer Vision (ICCV)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11443115\/11443287\/11444410.pdf?arnumber=11444410","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T05:06:07Z","timestamp":1777611967000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11444410\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,19]]},"references-count":50,"URL":"https:\/\/doi.org\/10.1109\/iccv51701.2025.01572","relation":{},"subject":[],"published":{"date-parts":[[2025,10,19]]}}}