{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,24]],"date-time":"2026-03-24T14:00:29Z","timestamp":1774360829324,"version":"3.50.1"},"publisher-location":"Cham","reference-count":24,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783032212993","type":"print"},{"value":"9783032213006","type":"electronic"}],"license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-21300-6_33","type":"book-chapter","created":{"date-parts":[[2026,3,24]],"date-time":"2026-03-24T13:09:31Z","timestamp":1774357771000},"page":"427-435","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["MiNER: A Two-Stage Pipeline for\u00a0Metadata Extraction from\u00a0Municipal Meeting Minutes"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0009-0004-0431-6042","authenticated-orcid":false,"given":"Rodrigo","family":"Batista","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1365-0080","authenticated-orcid":false,"given":"Lu\u00eds Filipe","family":"Cunha","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8057-5338","authenticated-orcid":false,"given":"Purifica\u00e7\u00e3o","family":"Silvano","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2854-2891","authenticated-orcid":false,"given":"Nuno","family":"Guimar\u00e3es","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5475-1382","authenticated-orcid":false,"given":"Al\u00edpio","family":"Jorge","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1343-939X","authenticated-orcid":false,"given":"Evelin","family":"Amorim","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8767-8126","authenticated-orcid":false,"given":"Ricardo","family":"Campos","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,3,25]]},"reference":[{"key":"33_CR1","unstructured":"Abdin, M., et\u00a0al.: Phi-4 technical report. arXiv preprint arXiv:2412.08905 (2024)"},{"key":"33_CR2","doi-asserted-by":"publisher","unstructured":"Campos, R., et al.: CitiLink-minutes: a multilayer annotated dataset of municipal meeting minutes (2025). https:\/\/doi.org\/10.25747\/7KG6-1K22","DOI":"10.25747\/7KG6-1K22"},{"key":"33_CR3","volume-title":"Advances in Information Retrieval","author":"R Campos","year":"2026","unstructured":"Campos, R., et al.: Citilink-minutes: a multilayer annotated dataset of municipal meeting minutes. In: Anand, A., et al. (eds.) Advances in Information Retrieval. Springer Nature Switzerland, Cham (2026)"},{"key":"33_CR4","unstructured":"CodeCarbon team: codecarbon. https:\/\/codecarbon.io\/, Accessed 01 Oct 2025"},{"key":"33_CR5","unstructured":"Council data project: councilproject. https:\/\/councildataproject.org\/, Accessed 10 Oct 2025"},{"key":"33_CR6","unstructured":"deepset: xlm-roberta-large-squad2. https:\/\/huggingface.co\/deepset\/xlm-roberta-large-squad2, Accessed 11 Oct 2025"},{"key":"33_CR7","doi-asserted-by":"publisher","unstructured":"Erjavec, T., et\u00a0al.: The parlamint corpora of parliamentary proceedings. Language Res. Eval. 57, 415\u2013448 (2023). https:\/\/doi.org\/10.1007\/s10579-021-09574-0","DOI":"10.1007\/s10579-021-09574-0"},{"key":"33_CR8","unstructured":"Faker contributors: faker. https:\/\/pypi.org\/project\/Faker\/, Accessed 15 Sep 2025"},{"key":"33_CR9","doi-asserted-by":"publisher","unstructured":"Goel, A.: LangExtract (2025). https:\/\/github.com\/google\/langextract, https:\/\/doi.org\/10.5281\/zenodo.17015089","DOI":"10.5281\/zenodo.17015089"},{"key":"33_CR10","unstructured":"Hugging face: xlm-roberta. https:\/\/huggingface.co\/docs\/transformers\/model_doc\/xlm-roberta , Accessed 15 Sep 2025"},{"key":"33_CR11","doi-asserted-by":"publisher","unstructured":"Hyv\u00f6nen, E., et al.: Publishing and using parliamentary linked data on the semantic web: parliamentsampo system for parliament of finland. Semantic Web 16(1), SW\u2013243683 (2025). https:\/\/doi.org\/10.3233\/SW-243683, https:\/\/journals.sagepub.com\/doi\/abs\/10.3233\/SW-243683","DOI":"10.3233\/SW-243683"},{"key":"33_CR12","doi-asserted-by":"publisher","first-page":"261","DOI":"10.1007\/978-3-031-56063-7_17","volume-title":"Advances in Information Retrieval","author":"A Jain","year":"2024","unstructured":"Jain, A., Sharma, R.: Enhancing legal named entity recognition using roberta-gcn with CRF: a nuanced approach for fine-grained entity recognition. In: Goharian, N., Tonellotto, N., He, Y., Lipani, A., McDonald, G., Macdonald, C., Ounis, I. (eds.) Advances in Information Retrieval, pp. 261\u2013267. Springer Nature Switzerland, Cham (2024)"},{"key":"33_CR13","doi-asserted-by":"publisher","unstructured":"Karpukhin, V., et al.: Dense passage retrieval for open-domain question answering. In: Webber, B., Cohn, T., He, Y., Liu, Y. (eds.) Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 6769\u20136781. Association for Computational Linguistics, Online (Nov 2020).https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.550, https:\/\/aclanthology.org\/2020.emnlp-main.550\/","DOI":"10.18653\/v1\/2020.emnlp-main.550"},{"key":"33_CR14","unstructured":"LinguAligner developers: lingualigner. https:\/\/pypi.org\/project\/LinguAligner\/, Accessed 15 Sep 2025"},{"key":"33_CR15","doi-asserted-by":"crossref","unstructured":"Mor-Lan, G., Levi, E., Sheafer, T., Shenhav, S.R.: IsraParlTweet: the israeli parliamentary and twitter resource. In: Calzolari, N., Kan, M.Y., Hoste, V., Lenci, A., Sakti, S., Xue, N. (eds.) Proceedings of the 2024 Joint International Conference on Computational Linguistics, Language Resources and Evaluation (LREC-COLING 2024), pp. 9372\u20139381. ELRA and ICCL, Torino, Italia (2024). https:\/\/aclanthology.org\/2024.lrec-main.819\/","DOI":"10.63317\/3mghh7x7a7ix"},{"key":"33_CR16","doi-asserted-by":"crossref","unstructured":"Rajpurkar, P., Jia, R., Liang, P.: Know what you don\u2019t know: unanswerable questions for squad (2018). https:\/\/arxiv.org\/abs\/1806.03822","DOI":"10.18653\/v1\/P18-2124"},{"key":"33_CR17","doi-asserted-by":"crossref","unstructured":"Rajpurkar, P., Zhang, J., Lopyrev, K., Liang, P.: Squad: 100,000+ questions for machine comprehension of text (2016). https:\/\/arxiv.org\/abs\/1606.05250","DOI":"10.18653\/v1\/D16-1264"},{"key":"33_CR18","doi-asserted-by":"publisher","unstructured":"Robertson, S., Zaragoza, H.: The probabilistic relevance framework: Bm25 and beyond. Found. Trends Inf. Retrieval 3, 333\u2013389 (2009). https:\/\/doi.org\/10.1561\/1500000019","DOI":"10.1561\/1500000019"},{"issue":"3","key":"33_CR19","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s10664-020-09933-5","volume":"26","author":"A Sleimi","year":"2021","unstructured":"Sleimi, A., et al.: An automated framework for the extraction of semantic legal metadata from legal texts. Empir. Softw. Eng. 26(3), 1\u201350 (2021). https:\/\/doi.org\/10.1007\/s10664-020-09933-5","journal-title":"Empir. Softw. Eng."},{"key":"33_CR20","doi-asserted-by":"crossref","unstructured":"Sousa, H., Almeida, R., Silvano, P., Cantante, I., Campos, R., Jorge, A.: Enhancing portuguese variety identification with cross-domain approaches (2025). https:\/\/arxiv.org\/abs\/2502.14394","DOI":"10.1609\/aaai.v39i24.34705"},{"key":"33_CR21","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1007\/978-3-030-61377-8_28","volume-title":"Intelligent Systems","author":"F Souza","year":"2020","unstructured":"Souza, F., Nogueira, R., Lotufo, R.: Bertimbau: Pretrained bert models for brazilian portuguese. In: Cerri, R., Prati, R.C. (eds.) Intelligent Systems, pp. 403\u2013417. Springer International Publishing, Cham (2020)"},{"key":"33_CR22","doi-asserted-by":"crossref","unstructured":"Spinosa, P., Giardiello, G., Cherubini, M., Marchi, S., Venturi, G., Montemagni, S.: Nlp-based metadata extraction for legal text consolidation. In: Proceedings of the 12th international conference on artificial intelligence and law, pp. 40\u201349 (2009)","DOI":"10.1145\/1568234.1568240"},{"key":"33_CR23","unstructured":"Team, G., et\u00a0al.: Gemini 1.5: unlocking multimodal understanding across millions of tokens of context. arXiv preprint arXiv:2403.05530 (2024)"},{"key":"33_CR24","doi-asserted-by":"publisher","first-page":"280","DOI":"10.1007\/978-981-96-0865-2_23","volume-title":"Sustainability and Empowerment in the Context of Digital Libraries","author":"Y Watanabe","year":"2025","unstructured":"Watanabe, Y., Ito, K., Matsubara, S.: Capabilities and challenges of LLMs in metadata extraction from scholarly papers. In: Oliver, G., Frings-Hessami, V., Du, J.T., Tezuka, T. (eds.) Sustainability and Empowerment in the Context of Digital Libraries, pp. 280\u2013287. Springer Nature Singapore, Singapore (2025)"}],"container-title":["Lecture Notes in Computer Science","Advances in Information Retrieval"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-21300-6_33","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,3,24]],"date-time":"2026-03-24T13:09:41Z","timestamp":1774357781000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-21300-6_33"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"ISBN":["9783032212993","9783032213006"],"references-count":24,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-21300-6_33","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]},"assertion":[{"value":"25 March 2026","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"ECIR","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Information Retrieval","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Delft","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"The Netherlands","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2026","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 March 2026","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2 April 2026","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"48","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ecir2026","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/ecir2026.eu\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}