{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,8]],"date-time":"2026-03-08T02:00:51Z","timestamp":1772935251634,"version":"3.50.1"},"reference-count":21,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,12,8]],"date-time":"2025-12-08T00:00:00Z","timestamp":1765152000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,12,8]],"date-time":"2025-12-08T00:00:00Z","timestamp":1765152000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,12,8]]},"DOI":"10.1109\/bigdata66926.2025.11402604","type":"proceedings-article","created":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T20:57:57Z","timestamp":1772830677000},"page":"7133-7142","source":"Crossref","is-referenced-by-count":0,"title":["Adaptation of Embedding Models to Financial Filings Via LLM Distillation"],"prefix":"10.1109","author":[{"given":"Eliot","family":"Brenner","sequence":"first","affiliation":[{"name":"Goldman Sachs,New York,NY,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Dominic","family":"Seyler","sequence":"additional","affiliation":[{"name":"Goldman Sachs,New York,NY,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Manjunath","family":"Hegde","sequence":"additional","affiliation":[{"name":"Goldman Sachs,New York,NY,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andrei","family":"Simion","sequence":"additional","affiliation":[{"name":"Goldman Sachs,New York,NY,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Koustuv","family":"Dasgupta","sequence":"additional","affiliation":[{"name":"Goldman Sachs,New York,NY,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bing","family":"Xiang","sequence":"additional","affiliation":[{"name":"Goldman Sachs,New York,NY,USA"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","volume-title":"Meta AI. Llama-3.1\u201370b-instruct model card","year":"2024"},{"key":"ref2","article-title":"Artificial Analysis","volume-title":"Artificial analysis ai review 2024 highlights","year":"2024"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-industry.26"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3477495.3531863"},{"key":"ref5","volume-title":"How to do agentic rag on sec edgar filings","year":"2024"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.findings-acl.855"},{"key":"ref7","volume-title":"Statistical Power Analysis for the Behavioral Sciences","author":"Cohen","year":"1988"},{"key":"ref8","article-title":"From local to global: A graph RAG approach to query-focused summarization","author":"Edge","year":"2024","journal-title":"arXiv preprint"},{"key":"ref9","article-title":"Financebench: A new benchmark for financial question answering","author":"Islam","year":"2023","journal-title":"arXiv preprint"},{"key":"ref10","article-title":"Towards general text embeddings with multi-stage contrastive learning","author":"Li","year":"2023","journal-title":"arXiv preprint"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-industry.66"},{"issue":"Nov","key":"ref12","first-page":"2579","article-title":"Visualizing data using t -sne","volume":"9","author":"Van der Maaten","year":"2008","journal-title":"Journal of machine learning research"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.econlp-1.5"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-short.42"},{"key":"ref15","article-title":"Do we need domain-specific embedding models? an empirical investigation","author":"Tang","year":"2024","journal-title":"arXiv preprint"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.emnlp-main.179"},{"key":"ref17","volume-title":"EDGAR Filer Manual Volume II: EDGAR Filing. U.S. Securities and Exchange Commission","year":"2025"},{"key":"ref18","volume-title":"Edgar electronic data gathering, analysis, and retrieval system","year":"2025"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.emnlp-main.292"},{"key":"ref20","first-page":"5776","article-title":"Minilm: Deep self-attention distillation for task-agnostic compression of pre-trained transformers","volume":"33","author":"Wang","year":"2020","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.naacl-industry.23"}],"event":{"name":"2025 IEEE International Conference on Big Data (BigData)","location":"Macau, China","start":{"date-parts":[[2025,12,8]]},"end":{"date-parts":[[2025,12,11]]}},"container-title":["2025 IEEE International Conference on Big Data (BigData)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11400704\/11400712\/11402604.pdf?arnumber=11402604","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,7]],"date-time":"2026-03-07T07:27:32Z","timestamp":1772868452000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11402604\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,12,8]]},"references-count":21,"URL":"https:\/\/doi.org\/10.1109\/bigdata66926.2025.11402604","relation":{},"subject":[],"published":{"date-parts":[[2025,12,8]]}}}