{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,30]],"date-time":"2026-01-30T20:59:30Z","timestamp":1769806770549,"version":"3.49.0"},"reference-count":43,"publisher":"Springer Science and Business Media LLC","issue":"2","license":[{"start":{"date-parts":[[2026,1,30]],"date-time":"2026-01-30T00:00:00Z","timestamp":1769731200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,30]],"date-time":"2026-01-30T00:00:00Z","timestamp":1769731200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["SN COMPUT. SCI."],"DOI":"10.1007\/s42979-026-04735-w","type":"journal-article","created":{"date-parts":[[2026,1,30]],"date-time":"2026-01-30T11:13:59Z","timestamp":1769771639000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Impact of Domain Dependent Text Preprocessing on Summarization of Indian Legal Documents"],"prefix":"10.1007","volume":"7","author":[{"ORCID":"https:\/\/orcid.org\/0009-0003-0033-3913","authenticated-orcid":false,"family":"Nikita","sequence":"first","affiliation":[]},{"given":"Dipti P.","family":"Rana","sequence":"additional","affiliation":[]},{"given":"Rupa G.","family":"Mehta","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,1,30]]},"reference":[{"issue":"1","key":"4735_CR1","doi-asserted-by":"publisher","first-page":"110","DOI":"10.1108\/IJLMA-02-2021-0049","volume":"64","author":"SNS Chatterjee","year":"2022","unstructured":"Chatterjee S, N S. Artificial intelligence and human rights: a comprehensive study from Indian legal and policy perspective. Int J Law Manag. 2022;64(1):110\u201334. https:\/\/doi.org\/10.1108\/IJLMA-02-2021-0049.","journal-title":"Int J Law Manag"},{"issue":"8\/9","key":"4735_CR2","doi-asserted-by":"publisher","first-page":"593","DOI":"10.1108\/LR-09-2015-0095","volume":"65","author":"RK Bhardwaj","year":"2016","unstructured":"Bhardwaj RK, Margam M. Online legal information system for Indian environment: a user\u2019s perspectives. Libr Rev. 2016;65(8\/9):593\u2013624. https:\/\/doi.org\/10.1108\/LR-09-2015-0095.","journal-title":"Libr Rev"},{"issue":"3\/4","key":"4735_CR3","doi-asserted-by":"publisher","first-page":"251","DOI":"10.1108\/NLW-07-2015-0050","volume":"117","author":"RK Bhardwaj","year":"2016","unstructured":"Bhardwaj RK, Madhusudhan M. Comparative analysis of online legal information sources in Indian environment. New Libr World. 2016;117(3\/4):251\u201378. https:\/\/doi.org\/10.1108\/NLW-07-2015-0050.","journal-title":"New Libr World"},{"key":"4735_CR4","doi-asserted-by":"publisher","first-page":"413","DOI":"10.1007\/978-3-030-15712-8_27","volume-title":"Advances in information retrieval","author":"P Bhattacharya","year":"2019","unstructured":"Bhattacharya P, Hiware K, Rajgaria S, Pochhi N, Ghosh K, Ghosh S. A comparative study of summarization algorithms applied to legal case judgments. In: Azzopardi L, Stein B, Fuhr N, Mayr P, Hauff C, Hiemstra D, editors. Advances in information retrieval. Cham: Springer International Publishing; 2019. pp. 413\u201328."},{"key":"4735_CR5","unstructured":"Saravanan M, Ravindran B, Raman S. Improving Legal Document Summarization Using Graphical Models. In: Proceedings of the 2006 Conference on Legal Knowledge and Information Systems: JURIX 2006: The Nineteenth Annual Conference. NLD: IOS Press; 2006. pp. 51\u201360."},{"key":"4735_CR6","doi-asserted-by":"crossref","unstructured":"Sanchez G. Sentence Boundary Detection in Legal Text. In: Proceedings of the Natural Legal Language Processing Workshop 2019. Minneapolis, Minnesota: Association for Computational Linguistics; 2019. pp. 31\u201338. Available from: https:\/\/aclanthology.org\/W19-2204","DOI":"10.18653\/v1\/W19-2204"},{"key":"4735_CR7","first-page":"3","volume-title":"Legal knowledge and information systems","author":"P Bhattacharya","year":"2019","unstructured":"Bhattacharya P, Paul S, Ghosh K, Ghosh S, Wyner A. Identification of rhetorical roles of sentences in Indian legal judgments. In: Legal knowledge and information systems. IOS Press; 2019. p. 3\u201312."},{"key":"4735_CR8","doi-asserted-by":"crossref","unstructured":"Paul S, Goyal P, Ghosh S. Automatic Charge Identification from Facts: A Few Sentence-Level Charge Annotations is All You Need. In: Proceedings of the 28th International Conference on Computational Linguistics. Barcelona, Spain (Online): International Committee on Computational Linguistics; 2020.pp. 1011\u20131022. Available from: https:\/\/aclanthology.org\/2020.coling-main.88","DOI":"10.18653\/v1\/2020.coling-main.88"},{"key":"4735_CR9","doi-asserted-by":"publisher","unstructured":"Moens MF, Boiy E, Palau RM, Reed C. Automatic Detection of Arguments in Legal Texts. In: Proceedings of the 11th International Conference on Artificial Intelligence and Law. ICAIL \u201907. New York, NY, USA: Association for Computing Machinery; 2007. pp. 225\u2013230. Available from: https:\/\/doi.org\/10.1145\/1276318.1276362","DOI":"10.1145\/1276318.1276362"},{"key":"4735_CR10","doi-asserted-by":"publisher","unstructured":"Ghosh S, Dutta M, Das T. Indian Legal Text Summarization: A Text Normalization-based Approach, 2022 IEEE 19th India Council International Conference (INDICON), Kochi, India, 2022, pp. 1\u20134. https:\/\/doi.org\/10.1109\/INDICON56171.2022.10039891","DOI":"10.1109\/INDICON56171.2022.10039891"},{"key":"4735_CR11","doi-asserted-by":"publisher","DOI":"10.1016\/j.cosrev.2021.100388","volume":"40","author":"D Jain","year":"2021","unstructured":"Jain D, Borah MD, Biswas A. Summarization of legal documents: where are we now and the way forward. Comput Sci Rev. 2021;40:100388. https:\/\/doi.org\/10.1016\/j.cosrev.2021.100388.","journal-title":"Comput Sci Rev"},{"issue":"5","key":"4735_CR12","doi-asserted-by":"publisher","first-page":"2141","DOI":"10.1016\/j.jksuci.2019.11.015","volume":"34","author":"D Anand","year":"2022","unstructured":"Anand D, Wagh R. Effective deep learning approaches for summarization of legal texts. J King Saud Univ-Comput Inf Sci. 2022;34(5):2141\u201350. https:\/\/doi.org\/10.1016\/j.jksuci.2019.11.015.","journal-title":"J King Saud Univ-Comput Inf Sci"},{"key":"4735_CR13","doi-asserted-by":"publisher","first-page":"35","DOI":"10.1007\/978-981-13-8934-4_4","volume-title":"From Extractive to Abstractive Summarization: A Journey","author":"P Mehta","year":"2019","unstructured":"Mehta P, Majumder P. Domain-Specific Summarisation. In: From Extractive to Abstractive Summarization: A Journey. Springer Singapore; 2019. p. 35\u201348. https:\/\/doi.org\/10.1007\/978-981-13-8934-4_4."},{"issue":"6","key":"4735_CR14","doi-asserted-by":"publisher","first-page":"1748","DOI":"10.1016\/j.ipm.2007.01.005","volume":"43","author":"MF Moens","year":"2007","unstructured":"Moens MF. Summarizing court decisions. Inf Process Manag. 2007;43(6):1748\u201364. https:\/\/doi.org\/10.1016\/j.ipm.2007.01.005.","journal-title":"Inf Process Manag"},{"key":"4735_CR15","unstructured":"Zhao Z, Ning H, Liu L, Huang C, lei Kong L, Han Y, et al. FIRE2019@AILA: legal information retrieval using improved BM25. In: Fire; 2019."},{"key":"4735_CR16","unstructured":"More R, Patil J, Palaskar A, Pawde A. Removing Named Entities to Find Precedent Legal Cases. In: Mehta P, Rosso P, Majumder P, Mitra M, editors. Working Notes of FIRE 2019 - Forum for Information Retrieval Evaluation, Kolkata, India, December 12\u201315, 2019, vol. 2517. CEUR-WS.org; 2019. p. 13\u20138."},{"key":"4735_CR17","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1007\/s10506-021-09304-5","volume":"31","author":"P Bhattacharya","year":"2023","unstructured":"Bhattacharya P, Paul S, Ghosh K, Ghosh S, Wyner A. Deeprhole: deep learning for rhetorical role labeling of sentences in legal case documents. Artif Intell Law. 2023;31:53\u201390. https:\/\/doi.org\/10.1007\/s10506-021-09304-5.","journal-title":"Artif Intell Law"},{"key":"4735_CR18","doi-asserted-by":"publisher","unstructured":"Gupta A, Furniturewala S, Kumari V, Sharma Y. Steno AI at SemEval-2023 Task 6: Rhetorical Role Labelling of Legal Documents using Transformers and Graph Neural Networks. In: Ojha AK, Do\u011fru\u00f6z AS, San Martino GD, Tayyar Madabushi H, Kumar R, Sartori E, editors. Proceedings of the 17th International Workshop on Semantic Evaluation (SemEval-2023). Association for Computational Linguistics; 2023. p. 1858\u201362. https:\/\/doi.org\/10.18653\/v1\/2023.semeval-1.256.","DOI":"10.18653\/v1\/2023.semeval-1.256"},{"key":"4735_CR19","unstructured":"Saravanan M, Ravindran B, Raman S. Automatic Identification of Rhetorical Roles using Conditional Random Fields for Legal Document Summarization. In: Proceedings of the Third International Joint Conference on Natural Language Processing: Volume-I; 2008. Available from: https:\/\/aclanthology.org\/I08-1063"},{"key":"4735_CR20","unstructured":"Farzindar A. (2004). Atefeh Farzindar and Guy Lapalme,\u2018LetSum, an automatic Legal Text Summarizing system\u2019in T. Gordon, editor, Legal Knowledge and Information Systems. Jurix 2004: The Seventeenth Annual Conference. Amsterdam: IOS Press, 2004, pp. 11\u201318. In Legal knowledge and information systems: JURIX 2004, the seventeenth annual conference (Vol. 120, p. 11). IOS Press."},{"key":"4735_CR21","first-page":"125","volume-title":"Legal knowledge and information systems","author":"I Nejadgholi","year":"2017","unstructured":"Nejadgholi I, Bougueng R, Witherspoon S. A semi-supervised training method for semantic search of legal facts in Canadian immigration cases. In: Legal knowledge and information systems. IOS Press; 2017. p. 125\u201334."},{"key":"4735_CR22","unstructured":"Venturi G. Design and development of TEMIS: a syntactically and semantically annotated corpus of italian legislative texts. In: proceedings of the workshop on semantic processing of legal texts (SPLeT 2012). Citeseer; 2012. pp. 1\u201312."},{"issue":"1","key":"4735_CR23","first-page":"4","volume":"4","author":"B Waltl","year":"2016","unstructured":"Waltl B, Matthes F, Waltl T, Grass T. Lexia: a data science environment for semantic analysis of German legal texts. Jusletter IT. 2016;4(1):4\u20131.","journal-title":"Jusletter IT"},{"key":"4735_CR24","doi-asserted-by":"publisher","first-page":"5497","DOI":"10.3233\/JIFS-189871","volume":"41","author":"J Dhanani","year":"2021","unstructured":"Dhanani J, Mehta R, Rana D. Legal document recommendation system: a cluster based pairwise similarity computation. J Intell Fuzzy Syst. 2021;41:5497\u2013509. https:\/\/doi.org\/10.3233\/JIFS-189871.","journal-title":"J Intell Fuzzy Syst"},{"key":"4735_CR25","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1108\/IJWIS-02-2021-0015","volume":"17","author":"J Dhanani","year":"2021","unstructured":"Dhanani J, Mehta R, Rana DP. Legal document recommendation system: a dictionary based approach. Int J Web Inf Syst. 2021;17:187\u2013203. https:\/\/doi.org\/10.1108\/IJWIS-02-2021-0015.","journal-title":"Int J Web Inf Syst"},{"key":"4735_CR26","doi-asserted-by":"crossref","unstructured":"Trivedi A, Trivedi A, Varshney S, Joshipura V, Mehta R, Dhanani J. Extracted summary based recommendation system for Indian legal documents. In 2020 11th International Conference on Computing, Communication and Networking Technologies (ICCCNT) (pp. 1\u20136). IEEE 2020.","DOI":"10.1109\/ICCCNT49239.2020.9225290"},{"key":"4735_CR27","doi-asserted-by":"publisher","unstructured":"Bhattacharya P, Poddar S, Rudra K, Ghosh K, Ghosh S. Incorporating Domain Knowledge for Extractive Summarization of Legal Case Documents. In: Proceedings of the Eighteenth International Conference on Artificial Intelligence and Law. ICAIL \u201921. New York, NY, USA: Association for Computing Machinery; 2021. pp. 22\u201331. Available from: https:\/\/doi.org\/10.1145\/3462757.3466092","DOI":"10.1145\/3462757.3466092"},{"key":"4735_CR28","doi-asserted-by":"publisher","unstructured":"Bhattacharya P, Ghosh K, Ghosh S, Pal A, Mehta P, Bhattacharya A et al. FIRE 2019 AILA Track: Artificial Intelligence for Legal Assistance. In: Proceedings of the 11th Annual Meeting of the Forum for Information Retrieval Evaluation. FIRE \u201919. New York, NY, USA: Association for Computing Machinery; 2019. pp. 4\u20136. Available from: https:\/\/doi.org\/10.1145\/3368567.3368587","DOI":"10.1145\/3368567.3368587"},{"key":"4735_CR29","doi-asserted-by":"publisher","unstructured":"Bhattacharya P, Mehta P, Ghosh K, Ghosh S, Pal A, Bhattacharya A et al. FIRE 2020 AILA Track: Artificial Intelligence for Legal Assistance. In: Proceedings of the 12th Annual Meeting of the Forum for Information Retrieval Evaluation. FIRE \u201920. New York, NY, USA: Association for Computing Machinery; 2021. pp. 1\u20133. Available from: https:\/\/doi.org\/10.1145\/3441501.3441510","DOI":"10.1145\/3441501.3441510"},{"issue":"1","key":"4735_CR30","doi-asserted-by":"publisher","DOI":"10.1007\/s42979-022-01446-w","volume":"4","author":"G Sharma","year":"2022","unstructured":"Sharma G, Sharma D. Automatic text summarization methods: a comprehensive review. SN Comput Sci. 2022;4(1):33. https:\/\/doi.org\/10.1007\/s42979-022-01446-w.","journal-title":"SN Comput Sci"},{"issue":"4","key":"4735_CR31","doi-asserted-by":"publisher","DOI":"10.1007\/s42979-023-01806-0","volume":"4","author":"SR Chowdhury","year":"2023","unstructured":"Chowdhury SR, Sarkar K. A new method for extractive text summarization using neural networks. SN Comput Sci. 2023;4(4):384. https:\/\/doi.org\/10.1007\/s42979-023-01806-0.","journal-title":"SN Comput Sci"},{"key":"4735_CR32","doi-asserted-by":"crossref","unstructured":"Merchant K, Pande Y. NLP Based Latent Semantic Analysis for Legal Text Summarization. In: 2018 International Conference on Advances in Computing, Communications and Informatics (ICACCI); 2018. pp. 1803\u20131807.","DOI":"10.1109\/ICACCI.2018.8554831"},{"issue":"7","key":"4735_CR33","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/s42979-024-03277-3","volume":"5","author":"S Sharma","year":"2024","unstructured":"Sharma S, Singh PP. Advancing legal document summarization: introducing an approach using a recursive summarization algorithm. SN Comput Sci. 2024;5(7):1\u201320. https:\/\/doi.org\/10.1007\/s42979-024-03277-3.","journal-title":"SN Comput Sci"},{"key":"4735_CR34","doi-asserted-by":"publisher","DOI":"10.1007\/s10506-024-09411-z","author":"A Deroy","year":"2024","unstructured":"Deroy A, Ghosh K, Ghosh S. Applicability of large language models and generative models for legal case judgement summarization. Artif Intell Law. 2024. https:\/\/doi.org\/10.1007\/s10506-024-09411-z.","journal-title":"Artif Intell Law"},{"key":"4735_CR35","doi-asserted-by":"publisher","DOI":"10.1007\/s44443-025-00022-5","author":"W Gao","year":"2025","unstructured":"Gao W, Yu S, Qin Y, Yang C, Huang R, Chen Y, et al. LSDK-legalsum: improving legal judgment summarization using logical structure and domain knowledge. J King Saud Univ Comput Inf Sci. 2025. https:\/\/doi.org\/10.1007\/s44443-025-00022-5.","journal-title":"J King Saud Univ Comput Inf Sci"},{"issue":"4","key":"4735_CR36","doi-asserted-by":"publisher","DOI":"10.1007\/s13198-025-02783-8","volume":"16","author":"S Sharma","year":"2025","unstructured":"Sharma S, Singh PP. Advancements in legal text summarization: integrating InLegalBERT for effective extractive summarization. Int J Syst Assur Eng Manag. 2025;123456789. https:\/\/doi.org\/10.1007\/s13198-025-02783-8.","journal-title":"Int J Syst Assur Eng Manag"},{"key":"4735_CR37","doi-asserted-by":"publisher","first-page":"231","DOI":"10.1007\/s10506-023-09349-8","volume":"32","author":"A Deroy","year":"2024","unstructured":"Deroy A, Ghosh K, Ghosh S, Springer Netherlands. Ensemble methods for improving extractive summarization of legal case judgements. Artif Intell Law. 2024;32:231\u201389. https:\/\/doi.org\/10.1007\/s10506-023-09349-8.","journal-title":"Artif Intell Law"},{"key":"4735_CR38","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2023.121571","volume":"237","author":"D Jain","year":"2024","unstructured":"Jain D, Borah MD, Biswas A. Summarization of lengthy legal documents via abstractive dataset building: an extract-then-assign approach. Expert Syst Appl. 2024;237(PB):121571. https:\/\/doi.org\/10.1016\/j.eswa.2023.121571.","journal-title":"Expert Syst Appl"},{"key":"4735_CR39","unstructured":"Polsley S, Jhunjhunwala P, Huang R, CaseSummarizer. A System for Automated Summarization of Legal Texts. In: Proceedings of COLING 2016, the 26th International Conference on Computational Linguistics: System Demonstrations. Osaka, Japan: The COLING 2016 Organizing Committee; 2016. pp. 258\u2013262. Available from: https:\/\/aclanthology.org\/C16-2054"},{"key":"4735_CR40","unstructured":"Lin CY. ROUGE: A Package for Automatic Evaluation of Summaries. In: Text Summarization Branches Out. Barcelona, Spain: Association for Computational Linguistics; 2004. pp. 74\u201381. Available from: https:\/\/aclanthology.org\/W04-1013"},{"key":"4735_CR41","unstructured":"Zhang T, Kishore V, Wu F, Weinberger KQ, Artzi Y. BERTScore: Evaluating Text Generation with BERT. arXiv. Available from: https:\/\/arxiv.org\/abs\/1904 .09675."},{"key":"4735_CR42","unstructured":"Banerjee S, Lavie A. METEOR: An Automatic Metric for MT Evaluation with Improved Correlation with Human Judgments. In: Goldstein J, Lavie A, Lin CY, Voss C, editors. Proceedings of the ACL workshop on Intrinsic and Extrinsic Evaluation Measures for Machine Translation and\/or Summarization. Ann Arbor, Michigan: Association for Computational Linguistics;2005. pp. 65\u201372. Available from: https:\/\/aclanthology.org\/W05-0909."},{"key":"4735_CR43","doi-asserted-by":"publisher","unstructured":"Zhao Z, Cohen SB, Webber B. Reducing Quantity Hallucinations in Abstractive Summarization. In: Cohn T, He Y, Liu Y, editors. Findings of the Association for Computational Linguistics: EMNLP 2020. Association for Computational Linguistics; 2020. p. 2237\u201349. https:\/\/doi.org\/10.18653\/v1\/2020.findings-emnlp.203.","DOI":"10.18653\/v1\/2020.findings-emnlp.203"}],"container-title":["SN Computer Science"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42979-026-04735-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s42979-026-04735-w","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s42979-026-04735-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,30]],"date-time":"2026-01-30T11:14:03Z","timestamp":1769771643000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s42979-026-04735-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,1,30]]},"references-count":43,"journal-issue":{"issue":"2","published-online":{"date-parts":[[2026,2]]}},"alternative-id":["4735"],"URL":"https:\/\/doi.org\/10.1007\/s42979-026-04735-w","relation":{},"ISSN":["2661-8907"],"issn-type":[{"value":"2661-8907","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,1,30]]},"assertion":[{"value":"24 July 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"6 January 2026","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"30 January 2026","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"On behalf of all authors, the corresponding author states that there is no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}],"article-number":"148"}}