{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,21]],"date-time":"2026-03-21T21:51:11Z","timestamp":1774129871609,"version":"3.50.1"},"publisher-location":"Cham","reference-count":23,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031790317","type":"print"},{"value":"9783031790324","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-79032-4_2","type":"book-chapter","created":{"date-parts":[[2025,1,29]],"date-time":"2025-01-29T22:14:28Z","timestamp":1738188868000},"page":"19-32","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["GovBERT-BR: A BERT-Based Language Model for\u00a0Brazilian Portuguese Governmental Data"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0110-9924","authenticated-orcid":false,"given":"Mariana O.","family":"Silva","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7210-6408","authenticated-orcid":false,"given":"Gabriel P.","family":"Oliveira","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-8898-4237","authenticated-orcid":false,"given":"Lucas G. L.","family":"Costa","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0349-4494","authenticated-orcid":false,"given":"Gisele L.","family":"Pappa","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,1,30]]},"reference":[{"key":"2_CR1","doi-asserted-by":"crossref","unstructured":"Al-Qurishi, M., AlQaseemi, S., Souissi, R.: Aralegal-bert: a pretrained language model for arabic legal text. In: NLLP@EMNLP, pp. 338\u2013344. Association for Computational Linguistics (2022)","DOI":"10.18653\/v1\/2022.nllp-1.31"},{"key":"2_CR2","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"557","DOI":"10.1007\/978-3-030-91699-2_38","volume-title":"Intelligent Systems","author":"R Aragy","year":"2021","unstructured":"Aragy, R., Fernandes, E.R., Caceres, E.N.: Rhetorical role identification for portuguese legal documents. In: Britto, A., Valdivia Delgado, K. (eds.) BRACIS 2021. LNCS (LNAI), vol. 13074, pp. 557\u2013571. Springer, Cham (2021). https:\/\/doi.org\/10.1007\/978-3-030-91699-2_38"},{"issue":"2","key":"2_CR3","doi-asserted-by":"publisher","first-page":"74","DOI":"10.3390\/info15020074","volume":"15","author":"M Bogdanovic","year":"2024","unstructured":"Bogdanovic, M., Kocic, J., Stoimenov, L.: Srberta - a transformer language model for serbian cyrillic legal texts. Information 15(2), 74 (2024)","journal-title":"Information"},{"key":"2_CR4","doi-asserted-by":"publisher","unstructured":"Brand\u00e3o, M.A., et\u00a0al.: PLUS: a semi-automated pipeline for fraud detection in public bids. Digit. Gov. Res. Pract. 5(1), 5:1\u20135:16 (2024). https:\/\/doi.org\/10.1145\/3616396","DOI":"10.1145\/3616396"},{"key":"2_CR5","doi-asserted-by":"publisher","unstructured":"Constantino, K., et\u00a0al.: Segmenta\u00e7\u00e3o e Classifica\u00e7\u00e3o Sem\u00e2ntica de Trechos de Di\u00e1rios Oficiais Usando Aprendizado Ativo. In: SBBD, pp. 304\u2013316. SBC (2022).https:\/\/doi.org\/10.5753\/sbbd.2022.224656","DOI":"10.5753\/sbbd.2022.224656"},{"key":"2_CR6","doi-asserted-by":"publisher","unstructured":"Devlin, J., Chang, M., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding. In: NAACL-HLT, pp. 4171\u20134186. Association for Computational Linguistics (2019).https:\/\/doi.org\/10.18653\/v1\/n19-1423","DOI":"10.18653\/v1\/n19-1423"},{"key":"2_CR7","doi-asserted-by":"crossref","unstructured":"Gao, S., Gao, L., Li, Q., Xu, J.: Application of large language model in intelligent Q &A of digital government. In: CNCIT, pp. 24\u201327. ACM (2023)","DOI":"10.1145\/3605801.3605806"},{"key":"2_CR8","unstructured":"Garcia, E.A.S., et al.: Robertalexpt: a legal roberta model pretrained with deduplication for portuguese. In: PROPOR, pp. 374\u2013383. ACL (2024)"},{"key":"2_CR9","doi-asserted-by":"publisher","first-page":"8633","DOI":"10.1109\/ACCESS.2024.3349969","volume":"12","author":"J Han","year":"2024","unstructured":"Han, J., Lu, J., Xu, Y., You, J., Wu, B.: Intelligent practices of large language models in digital government services. IEEE Access 12, 8633\u20138640 (2024)","journal-title":"IEEE Access"},{"key":"2_CR10","doi-asserted-by":"publisher","unstructured":"Hott, H.R., Silva, M.O., Oliveira, G.P., Brand\u00e3o, M.A., Lacerda, A., Pappa, G.L.: Evaluating contextualized embeddings for topic modeling in public bidding domain. In: BRACIS. LNCS, vol. 14197, pp. 410\u2013426. Springer, Cham (2023). https:\/\/doi.org\/10.1007\/978-3-031-45392-2_27","DOI":"10.1007\/978-3-031-45392-2_27"},{"key":"2_CR11","doi-asserted-by":"publisher","DOI":"10.1016\/j.clsr.2023.105908","volume":"52","author":"D Licari","year":"2024","unstructured":"Licari, D., Comand\u00e9, G.: ITALIAN-LEGAL-BERT models for improving natural language processing tasks in the italian legal domain. Comput. Law Secur. Rev. 52, 105908 (2024)","journal-title":"Comput. Law Secur. Rev."},{"key":"2_CR12","unstructured":"Lins, A.A., Carvalho, C.S., das Chagas Juc\u00e1\u00a0Bomfim, F., de\u00a0Carvalho\u00a0Bentes, D., Pinheiro, V.: CLSJUR.BR - a model for abstractive summarization of legal documents in portuguese language based on contrastive learning. In: PROPOR, pp. 321\u2013331. ACL (2024)"},{"key":"2_CR13","unstructured":"Luz de Araujo, P.H., de\u00a0Campos, T.E., Braz, F.A., da\u00a0Silva, N.C.: VICTOR: a dataset for Brazilian legal documents classification. In: LREC, pp. 1449\u20131458. ELRA (2020)"},{"key":"2_CR14","doi-asserted-by":"crossref","unstructured":"Mamalis, M.E., Kalampokis, E., Karamanou, A., Brimos, P., Tarabanis, K.A.: Can large language models revolutionalize open government data portals? A case of using chatgpt in statistics.gov.scot. In: PCI, pp. 53\u201359. ACM (2023)","DOI":"10.31219\/osf.io\/9b35z"},{"key":"2_CR15","doi-asserted-by":"crossref","unstructured":"Miyazaki, K., Yamada, H., Tokunaga, T.: Cross-domain analysis on japanese legal pretrained language models. In: AACL\/IJCNLP (Findings), pp. 274\u2013281. Association for Computational Linguistics (2022)","DOI":"10.18653\/v1\/2022.findings-aacl.26"},{"key":"2_CR16","doi-asserted-by":"publisher","unstructured":"Polo, F.M., Ciochetti, I., Bertolo, E.: Predicting legal proceedings status: approaches based on sequential text data. In: ICAIL, pp. 264\u2013265. ACM (2021). https:\/\/doi.org\/10.1145\/3462757.3466138","DOI":"10.1145\/3462757.3466138"},{"key":"2_CR17","doi-asserted-by":"publisher","unstructured":"Silva, M.O., et\u00a0al.: LiPSet: Um Conjunto de Dados com Documentos Rotulados de Licita\u00e7\u00f5es P\u00fablicas. In: DSW, pp. 13\u201324. SBC (2022). https:\/\/doi.org\/10.5753\/dsw.2022.224925","DOI":"10.5753\/dsw.2022.224925"},{"key":"2_CR18","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"104","DOI":"10.1007\/978-3-030-91699-2_8","volume-title":"Intelligent Systems","author":"NFF Silva","year":"2021","unstructured":"Silva, N.F.F., et al.: Evaluating topic models in portuguese political comments about bills from brazil\u2019s chamber of deputies. In: Britto, A., Valdivia Delgado, K. (eds.) BRACIS 2021. LNCS (LNAI), vol. 13074, pp. 104\u2013120. Springer, Cham (2021). https:\/\/doi.org\/10.1007\/978-3-030-91699-2_8"},{"key":"2_CR19","series-title":"Lecture Notes in Computer Science (Lecture Notes in Artificial Intelligence)","doi-asserted-by":"publisher","first-page":"403","DOI":"10.1007\/978-3-030-61377-8_28","volume-title":"Intelligent Systems","author":"F Souza","year":"2020","unstructured":"Souza, F., Nogueira, R., Lotufo, R.: BERTimbau: pretrained BERT models for Brazilian Portuguese. In: Cerri, R., Prati, R.C. (eds.) BRACIS 2020. LNCS (LNAI), vol. 12319, pp. 403\u2013417. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-61377-8_28"},{"key":"2_CR20","doi-asserted-by":"publisher","unstructured":"de\u00a0V.\u00a0Silveira, R., Ponte, C., Almeida, V., Pinheiro, V., Furtado, V.: LegalBert-pt: a pretrained language model for the Brazilian Portuguese legal domain. In: BRACIS. LNCS, vol. 14197, pp. 268\u2013282. Springer, Cham (2023). https:\/\/doi.org\/10.1007\/978-3-031-45392-2_18","DOI":"10.1007\/978-3-031-45392-2_18"},{"key":"2_CR21","doi-asserted-by":"crossref","unstructured":"Viegas, C.F.O., Costa, B.C., Ishii, R.P.: Jurisbert: a new approach that converts a classification corpus into an STS one. In: ICCSA. LNCS, vol. 13956, pp. 349\u2013365. Springer, Cham (2023)","DOI":"10.1007\/978-3-031-36805-9_24"},{"key":"2_CR22","doi-asserted-by":"publisher","first-page":"79","DOI":"10.1016\/j.aiopen.2021.06.003","volume":"2","author":"C Xiao","year":"2021","unstructured":"Xiao, C., Hu, X., Liu, Z., Tu, C., Sun, M.: Lawformer: a pre-trained language model for chinese legal long documents. AI Open 2, 79\u201384 (2021)","journal-title":"AI Open"},{"issue":"3","key":"2_CR23","doi-asserted-by":"publisher","first-page":"46","DOI":"10.3390\/data8030046","volume":"8","author":"IN Yulita","year":"2023","unstructured":"Yulita, I.N., Wijaya, V., Rosadi, R., Sarathan, I., Djuyandi, Y., Prabuwono, A.S.: Analysis of government policy sentiment regarding vacation during the COVID-19 pandemic using the bidirectional encoder representation from transformers (BERT). Data 8(3), 46 (2023)","journal-title":"Data"}],"container-title":["Lecture Notes in Computer Science","Intelligent Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-79032-4_2","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,1,29]],"date-time":"2025-01-29T22:14:31Z","timestamp":1738188871000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-79032-4_2"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9783031790317","9783031790324"],"references-count":23,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-79032-4_2","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"30 January 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"BRACIS","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Brazilian Conference on Intelligent Systems","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Bel\u00e9m do Par\u00e1","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Brazil","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17 November 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21 November 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"34","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"bracis2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}