{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T17:46:12Z","timestamp":1777657572789,"version":"3.51.4"},"publisher-location":"Cham","reference-count":51,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031730207","type":"print"},{"value":"9783031730214","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,11,21]],"date-time":"2024-11-21T00:00:00Z","timestamp":1732147200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,21]],"date-time":"2024-11-21T00:00:00Z","timestamp":1732147200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-73021-4_13","type":"book-chapter","created":{"date-parts":[[2024,11,20]],"date-time":"2024-11-20T09:18:48Z","timestamp":1732094328000},"page":"213-229","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["Improving Geo-Diversity of\u00a0Generated Images with\u00a0Contextualized Vendi Score Guidance"],"prefix":"10.1007","author":[{"given":"Reyhane","family":"Askari Hemmat","sequence":"first","affiliation":[]},{"given":"Melissa","family":"Hall","sequence":"additional","affiliation":[]},{"given":"Alicia","family":"Sun","sequence":"additional","affiliation":[]},{"given":"Candace","family":"Ross","sequence":"additional","affiliation":[]},{"given":"Michal","family":"Drozdzal","sequence":"additional","affiliation":[]},{"given":"Adriana","family":"Romero-Soriano","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,21]]},"reference":[{"key":"13_CR1","doi-asserted-by":"crossref","unstructured":"Bansal, H., Yin, D., Monajatipoor, M., Chang, K.W.: How well can text-to-image generative models understand ethical natural language interventions? In: EMNLP (Short) (2022)","DOI":"10.18653\/v1\/2022.emnlp-main.88"},{"key":"13_CR2","doi-asserted-by":"crossref","unstructured":"Basu, A., Babu, R.V., Pruthi, D.: Inspecting the geographical representativeness of images from text-to-image models. arXiv preprint arXiv:2305.11080 (2023)","DOI":"10.1109\/ICCV51070.2023.00474"},{"key":"13_CR3","unstructured":"Berns, S., Colton, S., Guckelsberger, C.: Towards mode balancing of generative models via diversity weights (2023)"},{"key":"13_CR4","doi-asserted-by":"crossref","unstructured":"Bianchi, F., et al.: Easily accessible text-to-image generation amplifies demographic stereotypes at large scale (2022)","DOI":"10.1145\/3593013.3594095"},{"key":"13_CR5","unstructured":"Bolukbasi, T., Chang, K.W., Zou, J.Y., Saligrama, V., Kalai, A.T.: Man is to computer programmer as woman is to homemaker? Debiasing word embeddings. In: Advances in Neural Information Processing Systems, vol. 29 (2016)"},{"key":"13_CR6","unstructured":"Brack, M., Friedrich, F., Hintersdorf, D., Struppek, L., Schramowski, P., Kersting, K.: SEGA: instructing text-to-image models using semantic guidance (2023)"},{"key":"13_CR7","unstructured":"Brack, M., Friedrich, F., Schramowski, P., Kersting, K.: Mitigating inappropriateness in image generation: can there be value in reflecting the world\u2019s ugliness? arXiv preprint arXiv:2305.18398 (2023)"},{"key":"13_CR8","doi-asserted-by":"crossref","unstructured":"Cho, J., Zala, A., Bansal, M.: DALL-Eval: probing the reasoning skills and social biases of text-to-image generative transformers (2022)","DOI":"10.1109\/ICCV51070.2023.00283"},{"key":"13_CR9","unstructured":"Chuang, C.Y., Jampani, V., Li, Y., Torralba, A., Jegelka, S.: Debiasing vision-language models via biased prompts. arXiv preprint arXiv:2302.00070 (2023)"},{"key":"13_CR10","doi-asserted-by":"crossref","unstructured":"Clemmer, C., Ding, J., Feng, Y.: PreciseDebias: an automatic prompt engineering approach for generative AI to mitigate image demographic biases. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 8596\u20138605 (2024)","DOI":"10.1109\/WACV57701.2024.00840"},{"key":"13_CR11","doi-asserted-by":"publisher","unstructured":"Deng, J., Dong, W., Socher, R., Li, L.J., Li, K., Fei-Fei, L.: ImageNet: a large-scale hierarchical image database. In: 2009 IEEE Conference on Computer Vision and Pattern Recognition, pp. 248\u2013255 (2009). https:\/\/doi.org\/10.1109\/CVPR.2009.5206848","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"13_CR12","unstructured":"Dhariwal, P., Nichol, A.: Diffusion models beat GANs on image synthesis. In: Advances in Neural Information Processing Systems, vol. 34, pp. 8780\u20138794 (2021)"},{"key":"13_CR13","unstructured":"Friedman, D., Dieng, A.B.: The vendi score: a diversity evaluation metric for machine learning. arXiv preprint arXiv:2210.02410 (2022)"},{"key":"13_CR14","doi-asserted-by":"crossref","unstructured":"Friedrich, F., et al.: Fair diffusion: instructing text-to-image generation models on fairness (2023)","DOI":"10.1007\/s43681-024-00531-5"},{"key":"13_CR15","doi-asserted-by":"publisher","first-page":"89","DOI":"10.1007\/978-3-031-19784-0_6","volume-title":"Computer Vision-ECCV 2022, Part XV","author":"O Gafni","year":"2022","unstructured":"Gafni, O., Polyak, A., Ashual, O., Sheynin, S., Parikh, D., Taigman, Y.: Make-a-scene: scene-based text-to-image generation with human priors. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) ECCV 2022, Part XV. LNCS, vol. 13675, pp. 89\u2013106. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-19784-0_6"},{"key":"13_CR16","unstructured":"Gal, R., et al.: An image is worth one word: personalizing text-to-image generation using textual inversion. arXiv preprint arXiv:2208.01618 (2022)"},{"key":"13_CR17","doi-asserted-by":"crossref","unstructured":"Gandikota, R., Materzynska, J., Fiotto-Kaufman, J., Bau, D.: Erasing concepts from diffusion models. arXiv preprint arXiv:2303.07345 (2023)","DOI":"10.1109\/ICCV51070.2023.00230"},{"key":"13_CR18","unstructured":"Hall, M., Ross, C., Williams, A., Carion, N., Drozdzal, M., Soriano, A.R.: DIG in: evaluating disparities in image generations with indicators for geographic diversity (2023)"},{"key":"13_CR19","unstructured":"Hao, S., et al.: Harm amplification in text-to-image models (2024)"},{"key":"13_CR20","unstructured":"He, R., et al.: Is synthetic data from generative models ready for image recognition? arXiv preprint arXiv:2210.07574 (2023)"},{"key":"13_CR21","unstructured":"Hemmat, R.A., Pezeshki, M., Bordes, F., Drozdzal, M., Romero-Soriano, A.: Feedback-guided data synthesis for imbalanced classification (2023)"},{"key":"13_CR22","unstructured":"Heng, A., Soh, H.: Selective amnesia: a continual learning approach to forgetting in deep generative models. In: Advances in Neural Information Processing Systems, vol. 36 (2024)"},{"key":"13_CR23","doi-asserted-by":"crossref","unstructured":"Hessel, J., Holtzman, A., Forbes, M., Bras, R.L., Choi, Y.: CLIPscore: a reference-free evaluation metric for image captioning. arXiv preprint arXiv:2104.08718 (2021)","DOI":"10.18653\/v1\/2021.emnlp-main.595"},{"key":"13_CR24","unstructured":"Kim, E., Kim, S., Shin, C., Yoon, S.: De-stereotyping text-to-image models through prompt tuning (2023)"},{"key":"13_CR25","unstructured":"Kynk\u00e4\u00e4nniemi, T., Karras, T., Laine, S., Lehtinen, J., Aila, T.: Improved precision and recall metric for assessing generative models (2019)"},{"key":"13_CR26","unstructured":"Luccioni, A.S., Akiki, C., Mitchell, M., Jernite, Y.: Stable bias: analyzing societal representations in diffusion models (2023)"},{"key":"13_CR27","unstructured":"Ma\u00f1as, O., et al.: Improving text-to-image consistency via automatic prompt optimization (2024)"},{"key":"13_CR28","doi-asserted-by":"crossref","unstructured":"Miller, G.A.: WordNet: a lexical database for English. In: Human Language Technology: Proceedings of a Workshop held at Plainsboro, New Jersey, 8\u201311 March 1994 (1994). https:\/\/aclanthology.org\/H94-1111","DOI":"10.3115\/1075812.1075938"},{"key":"13_CR29","unstructured":"Naeem, M.F., Oh, S.J., Uh, Y., Choi, Y., Yoo, J.: Reliable fidelity and diversity metrics for generative models. In: International Conference on Machine Learning, pp. 7176\u20137185. PMLR (2020)"},{"key":"13_CR30","doi-asserted-by":"crossref","unstructured":"Naik, R., Nushi, B.: Social biases through the text-to-image generation lens (2023)","DOI":"10.1145\/3600211.3604711"},{"key":"13_CR31","unstructured":"Nichol, A., et al.: GLIDE: towards photorealistic image generation and editing with text-guided diffusion models. CoRR abs\/2112.10741 (2021). https:\/\/arxiv.org\/abs\/2112.10741"},{"key":"13_CR32","doi-asserted-by":"crossref","unstructured":"Orgad, H., Kawar, B., Belinkov, Y.: Editing implicit assumptions in text-to-image diffusion models. arXiv preprint arXiv:2303.08084 (2023)","DOI":"10.1109\/ICCV51070.2023.00649"},{"key":"13_CR33","unstructured":"Radford, A., et\u00a0al.: Learning transferable visual models from natural language supervision. In: International Conference on Machine Learning, pp. 8748\u20138763. PMLR (2021)"},{"key":"13_CR34","unstructured":"Ramaswamy, V.V., et al.: Beyond web-scraping: crowd-sourcing a geodiverse dataset. arXiv preprint (2023)"},{"key":"13_CR35","unstructured":"Ramesh, A., Dhariwal, P., Nichol, A., Chu, C., Chen, M.: Hierarchical text-conditional image generation with CLIP latents (2022)"},{"key":"13_CR36","doi-asserted-by":"publisher","first-page":"426","DOI":"10.1007\/978-3-031-19784-0_25","volume-title":"European Conference on Computer Vision 2022","author":"H Rangwani","year":"2022","unstructured":"Rangwani, H., Jaswani, N., Karmali, T., Jampani, V., Babu, R.V.: Improving GANs for long-tailed data through group spectral regularization. In: Avidan, S., Brostow, G., Ciss\u00e9, M., Farinella, G.M., Hassner, T. (eds.) ECCV 2022. LNCS, vol. 13675, pp. 426\u2013442. Springer, Cham (2022). https:\/\/doi.org\/10.1007\/978-3-031-19784-0_25"},{"key":"13_CR37","unstructured":"Rojas, W.A.G., Diamos, S., Kini, K.R., Kanter, D., Reddi, V.J., Coleman, C.: The dollar street dataset: images representing the geographic and socioeconomic diversity of the world. In: Thirty-Sixth Conference on Neural Information Processing Systems Datasets and Benchmarks Track (2022)"},{"key":"13_CR38","unstructured":"Rombach, R., Blattmann, A., Lorenz, D., Esser, P., Ommer, B.: High-resolution image synthesis with latent diffusion models. CoRR abs\/2112.10752 (2021). https:\/\/arxiv.org\/abs\/2112.10752"},{"key":"13_CR39","unstructured":"Sajjadi, M.S.M., Bachem, O., Lu\u010di\u0107, M., Bousquet, O., Gelly, S.: Assessing generative models via precision and recall. In: Advances in Neural Information Processing Systems (NeurIPS) (2018)"},{"key":"13_CR40","unstructured":"Salimans, T., Ho, J.: Progressive distillation for fast sampling of diffusion models. arXiv preprint arXiv:2202.00512 (2022)"},{"key":"13_CR41","doi-asserted-by":"crossref","unstructured":"Schramowski, P., Brack, M., Deiseroth, B., Kersting, K.: Safe latent diffusion: mitigating inappropriate degeneration in diffusion models. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 22522\u201322531 (2023)","DOI":"10.1109\/CVPR52729.2023.02157"},{"key":"13_CR42","doi-asserted-by":"crossref","unstructured":"Sehwag, V., Hazirbas, C., Gordo, A., Ozgenel, F., Ferrer, C.C.: Generating high fidelity data from low-density regions using diffusion models (2022)","DOI":"10.1109\/CVPR52688.2022.01120"},{"key":"13_CR43","unstructured":"Shin, J., Kang, M., Park, J.: Fill-Up: balancing long-tailed data with generative models. arXiv preprint arXiv:2306.07200 (2023)"},{"key":"13_CR44","unstructured":"Song, J., Meng, C., Ermon, S.: Denoising diffusion implicit models. In: Proceedings of the International Conference on Learning Representations (ICLR) (2020)"},{"key":"13_CR45","unstructured":"Song, Y., Dhariwal, P., Chen, M., Sutskever, I.: Consistency models (2023)"},{"key":"13_CR46","doi-asserted-by":"crossref","unstructured":"Tanjim, M.M., Singh, K.K., Kafle, K., Sinha, R., Cottrell, G.W.: Discovering and mitigating biases in CLIP-based image editing. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 2984\u20132993 (2024)","DOI":"10.1109\/WACV57701.2024.00296"},{"key":"13_CR47","unstructured":"Touvron, H., et al.: LLaMA: open and efficient foundation language models (2023)"},{"key":"13_CR48","unstructured":"Wan, Y., Chang, K.W.: The male CEO and the female assistant: probing gender biases in text-to-image models through paired stereotype test (2024)"},{"key":"13_CR49","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"377","DOI":"10.1007\/978-3-030-58542-6_23","volume-title":"Computer Vision \u2013 ECCV 2020","author":"N Yu","year":"2020","unstructured":"Yu, N., Li, K., Zhou, P., Malik, J., Davis, L., Fritz, M.: Inclusive GAN: improving data and minority coverage in generative models. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020, Part XXII. LNCS, vol. 12367, pp. 377\u2013393. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58542-6_23"},{"key":"13_CR50","doi-asserted-by":"crossref","unstructured":"Zhang, C., et al.: ITI-GEN: inclusive text-to-image generation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, pp. 3969\u20133980 (2023)","DOI":"10.1109\/ICCV51070.2023.00367"},{"key":"13_CR51","doi-asserted-by":"crossref","unstructured":"Zhang, E., Wang, K., Xu, X., Wang, Z., Shi, H.: Forget-me-not: learning to forget in text-to-image diffusion models. arXiv preprint arXiv:2303.17591 (2023)","DOI":"10.1109\/CVPRW63382.2024.00182"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-73021-4_13","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,20]],"date-time":"2024-11-20T09:44:48Z","timestamp":1732095888000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-73021-4_13"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,21]]},"ISBN":["9783031730207","9783031730214"],"references-count":51,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-73021-4_13","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,11,21]]},"assertion":[{"value":"21 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}