{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,27]],"date-time":"2025-09-27T00:12:23Z","timestamp":1758931943107,"version":"3.44.0"},"publisher-location":"Cham","reference-count":34,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783032061355","type":"print"},{"value":"9783032061362","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,9,27]],"date-time":"2025-09-27T00:00:00Z","timestamp":1758931200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,9,27]],"date-time":"2025-09-27T00:00:00Z","timestamp":1758931200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-06136-2_36","type":"book-chapter","created":{"date-parts":[[2025,9,26]],"date-time":"2025-09-26T18:38:04Z","timestamp":1758911884000},"page":"392-406","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Creating Datasets of\u00a0Moth Morphology and\u00a0Behaviour from\u00a0Textual Sources with\u00a0Large Language Models"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2181-0734","authenticated-orcid":false,"given":"Bartolome","family":"Ortiz-Viso","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5166-5510","authenticated-orcid":false,"given":"Jenna L.","family":"Lawson","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1116-3385","authenticated-orcid":false,"given":"Tom","family":"August","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,9,27]]},"reference":[{"key":"36_CR1","unstructured":"Acknowledgments $$|$$ Butterflies and Moths of North America. https:\/\/www.butterfliesandmoths.org\/acknowledgments"},{"key":"36_CR2","unstructured":"Butterflies and Moths of North America $$|$$ collecting and sharing data about Lepidoptera. https:\/\/www.butterfliesandmoths.org\/"},{"key":"36_CR3","unstructured":"Western Butterflies (Peterson Field Guide) by Opler, P.a.; Wright, A.b. https:\/\/www.pemberleybooks.com\/product\/western-butterflies-peterson-field-guide\/35828\/"},{"key":"36_CR4","unstructured":"Wikipedia, the free encyclopedia. https:\/\/www.wikipedia.org\/"},{"key":"36_CR5","unstructured":"Ball, L., Still, R., Riggs, A., Skilbeck, A., Shardlow, M., Whitehouse, A., Tinsley-Marshall, P.: The bugs matter citizen science survey (2021). https:\/\/cdn.buglife.org.uk\/2022\/05\/Bugs-Matter-2021-National-Report.pdf"},{"key":"36_CR6","unstructured":"Bert\u00a0Gustafsson, T.M.: Lepidoptera - Svenska fj\u00e4rilar - Naturhistoriska riksmuseet. http:\/\/www3.nrm.se\/en\/svenska_fjarilar\/svenska_fjarilar.html"},{"key":"36_CR7","unstructured":"Charles V\u00a0Covell, J.: A Field Guide to Moths of Eastern North America. https:\/\/www.nhbs.com\/a-field-guide-to-moths-of-eastern-north-america-book"},{"key":"36_CR8","unstructured":"Grattafiori, A., et\u00a0al.: The llama 3 herd of models (2024). https:\/\/arxiv.org\/abs\/2407.21783"},{"key":"36_CR9","doi-asserted-by":"publisher","unstructured":"Guo, R., et al.: A survey on advancements in image\u2013text multimodal models: from general techniques to biomedical implementations. Comput. Biol. Med. 178, 108709 (2024). https:\/\/doi.org\/10.1016\/j.compbiomed.2024.108709, https:\/\/linkinghub.elsevier.com\/retrieve\/pii\/S0010482524007947","DOI":"10.1016\/j.compbiomed.2024.108709"},{"key":"36_CR10","doi-asserted-by":"publisher","unstructured":"H\u00f8ye, T.T., et al.: Deep learning and computer vision will transform entomology. Proc. Natl. Acad. Sci. 118(2), e2002545117 (2021). https:\/\/doi.org\/10.1073\/pnas.2002545117, https:\/\/www.pnas.org\/doi\/full\/10.1073\/pnas.2002545117, publisher:Proceedings of the National Academy of Sciences","DOI":"10.1073\/pnas.2002545117"},{"key":"36_CR11","doi-asserted-by":"publisher","unstructured":"Jain, A., Cunha, F., Bunsen, M., Pasi, L., Viklund, A., Larriv\u00e9e, M., Rolnick, D.: A machine learning pipeline for automated insect monitoring, June 2024. https:\/\/doi.org\/10.48550\/arXiv.2406.13031, http:\/\/arxiv.org\/abs\/2406.13031, arXiv:2406.13031 [cs]","DOI":"10.48550\/arXiv.2406.13031"},{"key":"36_CR12","unstructured":"Kimber, I.: UKMoths $$|$$ Guide to the moths of Great Britain and Ireland. https:\/\/www.ukmoths.org.uk\/"},{"key":"36_CR13","doi-asserted-by":"publisher","unstructured":"van Klink, R., et al.: Emerging technologies revolutionise insect ecology and monitoring. Trends Ecol. Evol. 37(10), 872\u2013885 (2022). https:\/\/doi.org\/10.1016\/j.tree.2022.06.001, https:\/\/www.sciencedirect.com\/science\/article\/pii\/S0169534722001343","DOI":"10.1016\/j.tree.2022.06.001"},{"key":"36_CR14","doi-asserted-by":"publisher","unstructured":"Korsch, D., Bodesheim, P., Brehm, G., Denzler, J.: Automated Visual Monitoring of Nocturnal Insects with Light-based Camera Traps, July 2023. https:\/\/doi.org\/10.48550\/arXiv.2307.15433, http:\/\/arxiv.org\/abs\/2307.15433, arXiv:2307.15433 [cs]","DOI":"10.48550\/arXiv.2307.15433"},{"key":"36_CR15","doi-asserted-by":"publisher","unstructured":"L\u00f6bl, I., Klausnitzer, B., Hartmann, M., Krell, F.T.: The Silent Extinction of Species and Taxonomists\u2014An Appeal to Science Policymakers and Legislators. Diversity 15(10), \u00a01053 (2023). https:\/\/doi.org\/10.3390\/d15101053, https:\/\/www.mdpi.com\/1424-2818\/15\/10\/1053, number: 10 Publisher:Multidisciplinary Digital Publishing Institute","DOI":"10.3390\/d15101053"},{"key":"36_CR16","doi-asserted-by":"publisher","unstructured":"Meier, R., Hartop, E., Pylatiuk, C., Srivathsan, A.: Towards holistic insect monitoring: species discovery, description, identification and traits for all insects. Philosophical Trans. Roy. Soc. B: Biol. Sci. 379(1904), 20230120 (2024). https:\/\/doi.org\/10.1098\/rstb.2023.0120, https:\/\/royalsocietypublishing.org\/doi\/10.1098\/rstb.2023.0120,publisher: Royal Society","DOI":"10.1098\/rstb.2023.0120"},{"key":"36_CR17","unstructured":"Myers, P., Espinosa, R., Parr, C.S., Jones, T., Hammond, G.S., Dewey, T.A.: The animal diversity web (online) (2025). https:\/\/animaldiversity.org. Accessed 06 June 2025"},{"key":"36_CR18","unstructured":"OpenAI, et\u00a0al.: Gpt-4 technical report (2024). https:\/\/arxiv.org\/abs\/2303.08774"},{"key":"36_CR19","unstructured":"OpenAI, et\u00a0al.: Gpt-4o system card (2024). https:\/\/arxiv.org\/abs\/2410.21276"},{"key":"36_CR20","unstructured":"of\u00a0Ornithology, C.L.: Search, All About Birds, Cornell Lab of Ornithology. https:\/\/www.allaboutbirds.org\/guide\/search"},{"key":"36_CR21","doi-asserted-by":"publisher","unstructured":"Ortiz-Viso, B., Martin-Bautista, M.J.: \u201cLet It BEE\u201d: natural language classification of arthropod specimens based on their spanish description. In: Larsen, H.L., Martin-Bautista, M.J., Ruiz, M.D., Andreasen, T., Bordogna, G., De\u00a0Tr\u00e9, G. (eds.) Flexible Query Answering Systems, pp. 118\u2013128. LNCS, Springer, Cham (2023). https:\/\/doi.org\/10.1007\/978-3-031-42935-4_10","DOI":"10.1007\/978-3-031-42935-4_10"},{"key":"36_CR22","doi-asserted-by":"crossref","unstructured":"Powell, J.A., Opler, P.A.: Moths of Western North America. Univ of California Press (May 2009), google-Books-ID: USoWEQAAQBAJ","DOI":"10.1525\/9780520943773"},{"key":"36_CR23","unstructured":"Radford, A., et al.: Learning Transferable Visual Models From Natural Language Supervision, February 2021. https:\/\/arxiv.org\/abs\/2103.00020v1"},{"key":"36_CR24","doi-asserted-by":"publisher","unstructured":"Reimers, N., Gurevych, I.: Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks, August 2019. https:\/\/doi.org\/10.48550\/arXiv.1908.10084, http:\/\/arxiv.org\/abs\/1908.10084, arXiv:1908.10084 [cs]","DOI":"10.48550\/arXiv.1908.10084"},{"key":"36_CR25","doi-asserted-by":"publisher","unstructured":"Roy, D.B., et al.: Towards a standardized framework for AI-assisted, image-based monitoring of nocturnal insects. Philosophical Trans. Roy. Soc. B: Biol. Sci. 379(1904), 20230108 (2024). https:\/\/doi.org\/10.1098\/rstb.2023.0108, https:\/\/royalsocietypublishing.org\/doi\/10.1098\/rstb.2023.0108, publisher: Royal Society","DOI":"10.1098\/rstb.2023.0108"},{"key":"36_CR26","unstructured":"SLU Artdatabanken: Artfakta (2024). https:\/\/www.artfakta.se. Accessed 06 June 2025"},{"key":"36_CR27","doi-asserted-by":"publisher","unstructured":"Stevens, S., et al.: BioCLIP: a vision foundation model for the tree of life, May 2024. https:\/\/doi.org\/10.48550\/arXiv.2311.18803, http:\/\/arxiv.org\/abs\/2311.18803, arXiv:2311.18803 [cs]","DOI":"10.48550\/arXiv.2311.18803"},{"key":"36_CR28","doi-asserted-by":"publisher","unstructured":"Troisemaine, C., Lemaire, V., Gosselin, S., Reiffers-Masson, A., Flocon-Cholet, J., Vaton, S.: Novel Class Discovery: an Introduction and Key Concepts, February 2023. https:\/\/doi.org\/10.48550\/arXiv.2302.12028, http:\/\/arxiv.org\/abs\/2302.12028, arXiv:2302.12028 [cs]","DOI":"10.48550\/arXiv.2302.12028"},{"key":"36_CR29","doi-asserted-by":"publisher","unstructured":"Truong, T.D., Nguyen, H.Q., Nguyen, X.B., Dowling, A., Li, X., Luu, K.: Insect-Foundation: A Foundation Model and Large Multimodal Dataset for Vision-Language Insect Understanding, February 2025. https:\/\/doi.org\/10.48550\/arXiv.2502.09906, http:\/\/arxiv.org\/abs\/2502.09906, arXiv:2502.09906 [cs]","DOI":"10.48550\/arXiv.2502.09906"},{"key":"36_CR30","doi-asserted-by":"publisher","unstructured":"Vaze, S., Han, K., Vedaldi, A., Zisserman, A.: Generalized Category Discovery, June 2022. https:\/\/doi.org\/10.48550\/arXiv.2201.02609, http:\/\/arxiv.org\/abs\/2201.02609, arXiv:2201.02609 [cs]","DOI":"10.48550\/arXiv.2201.02609"},{"key":"36_CR31","doi-asserted-by":"publisher","unstructured":"Wagner, D.L., Grames, E.M., Forister, M.L., Berenbaum, M.R., Stopak, D.: Insect decline in the Anthropocene: death by a thousand cuts. Proceedings of the National Academy of Sciences 118(2), e2023989118 (2021). https:\/\/doi.org\/10.1073\/pnas.2023989118, https:\/\/www.pnas.org\/doi\/full\/10.1073\/pnas.2023989118, publisher:Proceedings of the National Academy of Sciences","DOI":"10.1073\/pnas.2023989118"},{"key":"36_CR32","doi-asserted-by":"publisher","unstructured":"Wong, M.K.L., Gu\u00e9nard, B., Lewis, O.T.: Trait-based ecology of terrestrial arthropods. Biological Reviews 94(3), 999\u20131022 (2019). https:\/\/doi.org\/10.1111\/brv.12488, https:\/\/onlinelibrary.wiley.com\/doi\/abs\/10.1111\/brv.12488, _eprint:https:\/\/onlinelibrary.wiley.com\/doi\/pdf\/10.1111\/brv.12488","DOI":"10.1111\/brv.12488"},{"key":"36_CR33","unstructured":"Zhai, X., Wang, X., Mustafa, B., Steiner, A., Keysers, D., Kolesnikov, A., Beyer, L.: LiT: Zero-Shot Transfer with Locked-image text Tuning, November 2021. https:\/\/arxiv.org\/abs\/2111.07991v3"},{"key":"36_CR34","doi-asserted-by":"publisher","unstructured":"Zhang, B., Zhang, P., Dong, X., Zang, Y., Wang, J.: Long-CLIP: Unlocking the Long-Text Capability of CLIP, July 2024. https:\/\/doi.org\/10.48550\/arXiv.2403.15378, http:\/\/arxiv.org\/abs\/2403.15378, arXiv:2403.15378 [cs]","DOI":"10.48550\/arXiv.2403.15378"}],"container-title":["Communications in Computer and Information Science","New Trends in Theory and Practice of Digital Libraries"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-06136-2_36","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,26]],"date-time":"2025-09-26T18:38:08Z","timestamp":1758911888000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-06136-2_36"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,27]]},"ISBN":["9783032061355","9783032061362"],"references-count":34,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-06136-2_36","relation":{},"ISSN":["1865-0929","1865-0937"],"issn-type":[{"value":"1865-0929","type":"print"},{"value":"1865-0937","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,9,27]]},"assertion":[{"value":"27 September 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that\u00a0are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"Source code, prompts and other supplementary material can be found at","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Source Code"}},{"value":"TPDL","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Theory and Practice of Digital Libraries","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Tampere","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Finland","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 September 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 September 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"tpdl2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/tpdl2025.github.io\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}