{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,21]],"date-time":"2026-01-21T08:20:13Z","timestamp":1768983613300,"version":"3.49.0"},"reference-count":32,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,12,10]],"date-time":"2020-12-10T00:00:00Z","timestamp":1607558400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,12,10]],"date-time":"2020-12-10T00:00:00Z","timestamp":1607558400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,12,10]],"date-time":"2020-12-10T00:00:00Z","timestamp":1607558400000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,12,10]]},"DOI":"10.1109\/bigdata50022.2020.9378201","type":"proceedings-article","created":{"date-parts":[[2021,3,19]],"date-time":"2021-03-19T21:10:21Z","timestamp":1616188221000},"page":"2139-2148","source":"Crossref","is-referenced-by-count":18,"title":["Customizing Contextualized Language Models for Legal Document Reviews"],"prefix":"10.1109","author":[{"given":"Shohreh","family":"Shaghaghian","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Luna Yue","family":"Feng","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Borna","family":"Jafarpour","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Nicolai","family":"Pogrebnyakov","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref32","first-page":"2440","article-title":"Wiki-40b: Multilingual language model dataset","author":"guo","year":"2020","journal-title":"Proceedings of the 12th Language Resources and Evaluation Conference"},{"key":"ref31","article-title":"Huggingface's transformers: State-of-the-art natural language processing","author":"wolf","year":"2019"},{"key":"ref30","article-title":"Albert: A lite bert for self-supervised learning of language representations","author":"lan","year":"2019","journal-title":"Proceedings of the International Conference on Learning Representations (ICLR)"},{"key":"ref10","first-page":"72","article-title":"End-to-end open-domain question answering with bertserini","author":"yang","year":"2019","journal-title":"Proceedings of the International Conference of the North American Chapter of the Association for Computational Linguistics (Demonstrations)"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.11"},{"key":"ref12","first-page":"1234","article-title":"Biobert: a pretrained biomedical language representation model for biomedical text mining","volume":"36","author":"lee","year":"2020","journal-title":"Bioinformatics (Oxford England)"},{"key":"ref13","article-title":"Finbert: Financial sentiment analysis with pre-trained language models","author":"araci","year":"2019"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P18-1031"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-1202"},{"key":"ref16","article-title":"Scibert: Pretrained contextualized embeddings for scientific text","author":"beltagy","year":"2019"},{"key":"ref17","article-title":"Lstm-based deep learning models for non-factoid answer selection","author":"tan","year":"2015"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2013.6638947"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1145\/2939672.2939785"},{"key":"ref28","first-page":"9","article-title":"Distilling the knowledge in a neural network","volume":"1050","author":"hinton","year":"2015","journal-title":"Stat"},{"key":"ref4","first-page":"5998","article-title":"Attention is all you need","author":"vaswani","year":"2017","journal-title":"In Advances in neural information processing systems (NeurIPS)"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W18-5446"},{"key":"ref3","article-title":"A survey on neural network language models","author":"jing","year":"2019"},{"key":"ref6","doi-asserted-by":"crossref","DOI":"10.18653\/v1\/2020.findings-emnlp.261","article-title":"Legal-bert: The muppets straight out of law school","author":"chalkidis","year":"2020"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1145\/1150402.1150464"},{"key":"ref5","article-title":"Bert goes to law school: Quantifying the competitive advantage of access to large legal corpora in contract understanding","author":"elwany","year":"2019","journal-title":"Workshop on Document Intelligence at International Conference on Neural Information Processing Systems (NeurIPS)"},{"key":"ref8","article-title":"Bert: Pre-training of deep bidirectional transformers for language understanding","author":"devlin","year":"2019","journal-title":"Proceedings of the Annual Conference of the North American Chapter of the Association for Computational Linguistics Human Language Technologies (NAACL-HLT)"},{"key":"ref7","article-title":"Rapid adaptation of bert for information extraction on domain-specific business documents","author":"zhang","year":"2020"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2009.191"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/W19-4302"},{"key":"ref1","article-title":"Exploring the use of text classification in the legal domain","author":"sulea","year":"2017"},{"key":"ref20","first-page":"2132","article-title":"A review on deep learning techniques applied to answer selection","author":"lai","year":"2018","journal-title":"Proceedings of the International Conference On Computational Linguistics (COLING)"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3086512.3086528"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.2139\/ssrn.3338718"},{"key":"ref24","article-title":"Google's neural machine translation system: Bridging the gap between human and machine translation","author":"wu","year":"2016"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1016\/j.pragma.2005.02.003"},{"key":"ref26","article-title":"Distilbert, a distilled version of bert: smaller, faster, cheaper and lighter","author":"sanh","year":"2019"},{"key":"ref25","article-title":"Roberta: A robustly optimized bert pretraining approach","author":"liu","year":"2019"}],"event":{"name":"2020 IEEE International Conference on Big Data (Big Data)","location":"Atlanta, GA, USA","start":{"date-parts":[[2020,12,10]]},"end":{"date-parts":[[2020,12,13]]}},"container-title":["2020 IEEE International Conference on Big Data (Big Data)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9377717\/9377728\/09378201.pdf?arnumber=9378201","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,22]],"date-time":"2022-12-22T00:55:55Z","timestamp":1671670555000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9378201\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,12,10]]},"references-count":32,"URL":"https:\/\/doi.org\/10.1109\/bigdata50022.2020.9378201","relation":{},"subject":[],"published":{"date-parts":[[2020,12,10]]}}}