{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,6]],"date-time":"2026-06-06T07:18:27Z","timestamp":1780730307971,"version":"3.54.1"},"reference-count":36,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2023,7,19]],"date-time":"2023-07-19T00:00:00Z","timestamp":1689724800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,7,19]],"date-time":"2023-07-19T00:00:00Z","timestamp":1689724800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100002322","name":"Coordena\u00e7\u00e3o de Aperfei\u00e7oamento de Pessoal de N\u00edvel Superior","doi-asserted-by":"publisher","award":["001"],"award-info":[{"award-number":["001"]}],"id":[{"id":"10.13039\/501100002322","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Jusbrasil Postdoctoral Fellowship Program"},{"name":"FAPEAM-POSGRAD 2022"},{"DOI":"10.13039\/501100003593","name":"Conselho Nacional de Desenvolvimento Cient\u00edfico e Tecnol\u00f3gico","doi-asserted-by":"publisher","award":["307248\/2019-4"],"award-info":[{"award-number":["307248\/2019-4"]}],"id":[{"id":"10.13039\/501100003593","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Artif Intell Law"],"published-print":{"date-parts":[[2024,12]]},"DOI":"10.1007\/s10506-023-09371-w","type":"journal-article","created":{"date-parts":[[2023,7,19]],"date-time":"2023-07-19T06:02:52Z","timestamp":1689746572000},"page":"1045-1074","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":9,"title":["A topic discovery approach for unsupervised organization of legal document collections"],"prefix":"10.1007","volume":"32","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2943-5211","authenticated-orcid":false,"given":"Daniela","family":"Vianna","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Edleno Silva","family":"de Moura","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Altigran Soares","family":"da Silva","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2023,7,19]]},"reference":[{"key":"9371_CR1","unstructured":"Angelov D (2020) Top2vec: distributed representations of topics. CoRR arXiv:2008.09470"},{"key":"9371_CR2","doi-asserted-by":"publisher","unstructured":"Badenes-Olmedo C, Redondo-Garc\u00eda JL, Corcho O (2019) Scalable cross-lingual document similarity through language-specific concept hierarchies. In: Proceedings of the 10th international conference on knowledge capture. Association for Computing Machinery, pp 147\u2013153. https:\/\/doi.org\/10.1145\/3360901.3364444","DOI":"10.1145\/3360901.3364444"},{"key":"9371_CR3","doi-asserted-by":"publisher","unstructured":"Bianchi F, Terragni S, Hovy D (2021) Pre-training is a hot topic: contextualized document embeddings improve topic coherence. In: Proceedings of the 59th annual meeting of the association for computational linguistics and the 11th international joint conference on natural language processing (volume 2: short papers). Association for Computational Linguistics, pp 759\u2013766. https:\/\/doi.org\/10.18653\/v1\/2021.acl-short.96","DOI":"10.18653\/v1\/2021.acl-short.96"},{"key":"9371_CR4","first-page":"993","volume":"3","author":"DM Blei","year":"2003","unstructured":"Blei DM, Ng AY, Jordan MI (2003) Latent Dirichlet allocation. J Mach Learn Res 3:993\u20131022","journal-title":"J Mach Learn Res"},{"key":"9371_CR5","doi-asserted-by":"publisher","unstructured":"Chalkidis I, Androutsopoulos I, Aletras N (2019a) Neural legal judgment prediction in English. In: Proceedings of the 57th annual meeting of the association for computational linguistics, pp 4317\u20134323. https:\/\/doi.org\/10.18653\/v1\/P19-1424","DOI":"10.18653\/v1\/P19-1424"},{"key":"9371_CR6","doi-asserted-by":"publisher","unstructured":"Chalkidis I, Fergadiotis E, Malakasiotis P, et\u00a0al (2019b) Large-scale multi-label text classification on EU legislation. In: Proceedings of the 57th annual meeting of the association for computational linguistics, pp 6314\u20136322. https:\/\/doi.org\/10.18653\/v1\/P19-1636","DOI":"10.18653\/v1\/P19-1636"},{"key":"9371_CR7","doi-asserted-by":"publisher","unstructured":"Chalkidis I, Fergadiotis M, Malakasiotis P, et\u00a0al (2020) LEGAL-BERT: the muppets straight out of law school. In: Findings of the association for computational linguistics: EMNLP 2020. Association for Computational Linguistics, pp 2898\u20132904. https:\/\/doi.org\/10.18653\/v1\/2020.findings-emnlp.261","DOI":"10.18653\/v1\/2020.findings-emnlp.261"},{"key":"9371_CR8","doi-asserted-by":"publisher","unstructured":"Devlin J, Chang MW, Lee K, et\u00a0al (2019) BERT: pre-training of deep bidirectional transformers for language understanding. In: Proceedings of the 2019 conference of the North American chapter of the association for computational linguistics: human language technologies, volume 1 (long and short papers), pp 4171\u20134186. https:\/\/doi.org\/10.18653\/v1\/N19-1423","DOI":"10.18653\/v1\/N19-1423"},{"key":"9371_CR9","doi-asserted-by":"publisher","first-page":"439","DOI":"10.1162\/tacl_a_00325","volume":"8","author":"AB Dieng","year":"2020","unstructured":"Dieng AB, Ruiz FJR, Blei DM (2020) Topic modeling in embedding spaces. Trans Assoc Comput Linguist 8:439\u2013453. https:\/\/doi.org\/10.1162\/tacl_a_00325","journal-title":"Trans Assoc Comput Linguist"},{"key":"9371_CR10","doi-asserted-by":"publisher","first-page":"75,022","DOI":"10.1109\/ACCESS.2020.2988493","volume":"8","author":"Y Fang","year":"2020","unstructured":"Fang Y, Tian X, Wu H et al (2020) Few-shot learning for Chinese legal controversial issues classification. IEEE Access 8:75,022-75,034. https:\/\/doi.org\/10.1109\/ACCESS.2020.2988493","journal-title":"IEEE Access"},{"key":"9371_CR11","unstructured":"Grootendorst M (2022) Bertopic: neural topic modeling with a class-based tf-idf procedure. CoRR arXiv:2203.05794"},{"key":"9371_CR12","doi-asserted-by":"publisher","unstructured":"Gupta P, Chaudhary Y, Sch\u00fctze H (2021) Multi-source neural topic modeling in multi-view embedding spaces. In: Proceedings of the 2021 conference of the North American chapter of the association for computational linguistics: human language technologies. Association for Computational Linguistics, pp 4205\u20134217. https:\/\/doi.org\/10.18653\/v1\/2021.naacl-main.332","DOI":"10.18653\/v1\/2021.naacl-main.332"},{"issue":"11","key":"9371_CR13","doi-asserted-by":"publisher","first-page":"15169","DOI":"10.1007\/s11042-018-6894-4","volume":"78","author":"H Jelodar","year":"2019","unstructured":"Jelodar H, Wang Y, Yuan C et al (2019) Latent Dirichlet allocation (LDA) and topic modeling: models, applications, a survey. Multimed Tools Appl 78(11):15169\u201315211. https:\/\/doi.org\/10.1007\/s11042-018-6894-4","journal-title":"Multimed Tools Appl"},{"key":"9371_CR14","doi-asserted-by":"publisher","unstructured":"Mandal A, Chaki R, Saha S, et\u00a0al (2017) Measuring similarity among legal court case documents. In: Proceedings of the 10th annual ACM India compute conference. Association for Computing Machinery, pp 1\u20139. https:\/\/doi.org\/10.1145\/3140107.3140119","DOI":"10.1145\/3140107.3140119"},{"key":"9371_CR15","doi-asserted-by":"crossref","unstructured":"McInnes L, Healy J, Melville J (2018) Umap: uniform manifold approximation and projection for dimension reduction. arXiv","DOI":"10.21105\/joss.00861"},{"key":"9371_CR16","unstructured":"Miao Y, Yu L, Blunsom P (2016) Neural variational inference for text processing. In: Proceedings of the 33rd international conference on international conference on machine learning, vol 48, pp 1727\u20131736"},{"key":"9371_CR17","unstructured":"Mikolov T, Chen K, Corrado GS, et\u00a0al (2013) Efficient estimation of word representations in vector space. In: International conference on learning representations"},{"key":"9371_CR18","unstructured":"Mikolov T, Grave E, Bojanowski P, et\u00a0al (2018) Advances in pre-training distributed word representations. In: Proceedings of the international conference on language resources and evaluation (LREC 2018)"},{"key":"9371_CR19","doi-asserted-by":"crossref","unstructured":"Nanda R, John AK, Caro LD, et\u00a0al (2017) Legal information retrieval using topic clustering and neural networks. In: Satoh K, Kim MY, Kano Y, et\u00a0al (eds) COLIEE 2017. 4th competition on legal information extraction and entailment, EPiC series in computing, vol\u00a047. EasyChair, pp 68\u201378","DOI":"10.29007\/psgx"},{"key":"9371_CR20","doi-asserted-by":"publisher","unstructured":"Pennington J, Socher R, Manning C (2014) GloVe: global vectors for word representation. In: Proceedings of the 2014 conference on empirical methods in natural language processing (EMNLP). Association for Computational Linguistics, Doha, Qatar, pp 1532\u20131543. https:\/\/doi.org\/10.3115\/v1\/D14-1162","DOI":"10.3115\/v1\/D14-1162"},{"key":"9371_CR21","doi-asserted-by":"crossref","unstructured":"Polo FM, Mendon\u00e7a GCF, Parreira KCJ, et\u00a0al (2021) Legalnlp-natural language processing methods for the Brazilian legal language. In: Anais do XVIII Encontro Nacional de Intelig\u00eancia Artificial e Computacional, pp 763\u2013774","DOI":"10.5753\/eniac.2021.18301"},{"key":"9371_CR22","doi-asserted-by":"crossref","unstructured":"Rahman MF, Liu W, Suhaim SB, et\u00a0al (2016) Hdbscan: density based clustering over location based services. ArXiv arXiv:1602.03730","DOI":"10.1109\/ICDE.2016.7498346"},{"key":"9371_CR23","doi-asserted-by":"publisher","unstructured":"Reimers N, Gurevych I (2019) Sentence-BERT: sentence embeddings using Siamese BERT-networks. In: Proceedings of the 2019 conference on empirical methods in natural language processing and the 9th international joint conference on natural language processing (EMNLP-IJCNLP). Association for Computational Linguistics, Hong Kong, China, pp 3982\u20133992. https:\/\/doi.org\/10.18653\/v1\/D19-1410","DOI":"10.18653\/v1\/D19-1410"},{"key":"9371_CR24","unstructured":"Rosa GM, Rodrigues RC, de\u00a0Alencar\u00a0Lotufo R, et\u00a0al (2021) Yes, BM25 is a strong baseline for legal case retrieval. CoRR arXiv:2105.05686"},{"key":"9371_CR25","doi-asserted-by":"publisher","unstructured":"Shao Y, Mao J, Liu Y, et\u00a0al (2020) Bert-pli: modeling paragraph-level interactions for legal case retrieval. In: Proceedings of the twenty-ninth international joint conference on artificial intelligence, IJCAI-20, pp 3501\u20133507. https:\/\/doi.org\/10.24963\/ijcai.2020\/484","DOI":"10.24963\/ijcai.2020\/484"},{"key":"9371_CR26","doi-asserted-by":"crossref","unstructured":"Souza F, Nogueira R, Lotufo R (2020) Bertimbau: pretrained Bert models for Brazilian Portuguese. In: Intelligent systems, pp 403\u2013417","DOI":"10.1007\/978-3-030-61377-8_28"},{"key":"9371_CR27","unstructured":"Srivastava A, Sutton C (2017) Autoencoding variational inference for topic models. In: International conference on learning representations"},{"key":"9371_CR28","doi-asserted-by":"crossref","unstructured":"Terragni S, Fersini E, Messina E (2021) Word embedding-based topic similarity measures. In: Natural language processing and information systems, pp 33\u201345","DOI":"10.1007\/978-3-030-80599-9_4"},{"key":"9371_CR29","unstructured":"Thompson L, Mimno D (2020) Topic modeling with contextualized word representation clusters. CoRR arXiv:https:\/\/arxiv.org\/abs\/2010.12626"},{"key":"9371_CR30","doi-asserted-by":"publisher","unstructured":"Tran V, Nguyen ML, Satoh K (2019) Building legal case retrieval systems with lexical matching and summarization using a pre-trained phrase scoring model. In: Proceedings of the seventeenth international conference on artificial intelligence and law, pp 275-282. https:\/\/doi.org\/10.1145\/3322640.3326740","DOI":"10.1145\/3322640.3326740"},{"key":"9371_CR31","doi-asserted-by":"publisher","unstructured":"Vianna D, Silva\u00a0de Moura E (2022) Organizing Portuguese legal documents through topic discovery. In: Proceedings of the 45th international ACM SIGIR conference on research and development in information retrieval. Association for Computing Machinery, SIGIR \u201922, p 3388-3392, https:\/\/doi.org\/10.1145\/3477495.3536329","DOI":"10.1145\/3477495.3536329"},{"issue":"1","key":"9371_CR32","doi-asserted-by":"publisher","first-page":"111","DOI":"10.1016\/j.ipm.2014.08.003","volume":"51","author":"I Vuli\u0107","year":"2015","unstructured":"Vuli\u0107 I, De Smet W, Tang J et al (2015) Probabilistic topic modeling in multilingual settings: an overview of its methodology and applications. Inf Process Manag 51(1):111\u2013147. https:\/\/doi.org\/10.1016\/j.ipm.2014.08.003","journal-title":"Inf Process Manag"},{"key":"9371_CR33","unstructured":"Wagner\u00a0Filho JA, Wilkens R, Idiart M, et\u00a0al (2018) The brWaC corpus: a new open resource for Brazilian Portuguese. In: Proceedings of the eleventh international conference on language resources and evaluation (LREC 2018). European Language Resources Association (ELRA), Miyazaki, Japan"},{"issue":"1145\/1852102","key":"9371_CR34","first-page":"1852106","volume":"10","author":"W Webber","year":"2010","unstructured":"Webber W, Moffat A, Zobel J (2010) A similarity measure for indefinite rankings. ACM Trans Inf Syst 10(1145\/1852102):1852106","journal-title":"ACM Trans Inf Syst"},{"key":"9371_CR35","doi-asserted-by":"crossref","unstructured":"Wu TH, Kao B, Chan F, et\u00a0al (2022) Semantic search and summarization of judgments using topic modeling. In: Legal knowledge and information systems: JURIX 2021: the thirty-fourth annual conference, Vilnius, Lithuania, 8\u201310 Dec 2021, p 100","DOI":"10.3233\/FAIA210323"},{"key":"9371_CR36","doi-asserted-by":"publisher","unstructured":"Zhong H, Guo Z, Tu C, et\u00a0al (2018) Legal judgment prediction via topological learning. In: Proceedings of the 2018 conference on empirical methods in natural language processing, pp 3540\u20133549. https:\/\/doi.org\/10.18653\/v1\/D18-1390","DOI":"10.18653\/v1\/D18-1390"}],"container-title":["Artificial Intelligence and Law"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10506-023-09371-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10506-023-09371-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10506-023-09371-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,23]],"date-time":"2024-10-23T12:10:30Z","timestamp":1729685430000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10506-023-09371-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,7,19]]},"references-count":36,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2024,12]]}},"alternative-id":["9371"],"URL":"https:\/\/doi.org\/10.1007\/s10506-023-09371-w","relation":{},"ISSN":["0924-8463","1572-8382"],"issn-type":[{"value":"0924-8463","type":"print"},{"value":"1572-8382","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023,7,19]]},"assertion":[{"value":"4 July 2023","order":1,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 July 2023","order":2,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}