{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,19]],"date-time":"2025-11-19T06:57:19Z","timestamp":1763535439649,"version":"3.28.0"},"reference-count":7,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,12]]},"DOI":"10.1109\/bigdata.2016.7840747","type":"proceedings-article","created":{"date-parts":[[2017,2,7]],"date-time":"2017-02-07T21:46:59Z","timestamp":1486504019000},"page":"1394-1401","source":"Crossref","is-referenced-by-count":21,"title":["Empirical evaluations of preprocessing parameters' impact on predictive coding's effectiveness"],"prefix":"10.1109","author":[{"given":"Rishi","family":"Chhatwal","sequence":"first","affiliation":[]},{"given":"Nathaniel","family":"Huber-Fliflet","sequence":"additional","affiliation":[]},{"given":"Robert","family":"Keeling","sequence":"additional","affiliation":[]},{"given":"Jianping","family":"Zhang","sequence":"additional","affiliation":[]},{"given":"Haozhen","family":"Zhao","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref4","volume":"6","author":"japkowicz","year":"2002","journal-title":"The class imbalance problem A systematic study Intelligent data analysis 6"},{"key":"ref3","first-page":"412","article-title":"A Comparative Study on Feature Selection in Text Categorization","author":"yang","year":"0","journal-title":"Proceedings of the 14th International Conference on Machine Learning"},{"key":"ref6","article-title":"Beyond TFIDF weighting for text categorization in the vector space model","author":"soucy","year":"0","journal-title":"Proc of IJCAI"},{"key":"ref5","first-page":"137","article-title":"Text Categorization with Support Vector Machines: Learning with Many Relevant Features","author":"joachims","year":"0","journal-title":"Proceedings of the Tenth European Conference on Machine Learning (ECML)"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/312624.312647"},{"key":"ref2","article-title":"Where the Money Goes: Understanding Litigant Expenditures for Producing Electronic Discovery","volume":"17","author":"nicholas","year":"2012"},{"journal-title":"The Age of Big Data New York Times","year":"2012","author":"steve","key":"ref1"}],"event":{"name":"2016 IEEE International Conference on Big Data (Big Data)","start":{"date-parts":[[2016,12,5]]},"location":"Washington DC,USA","end":{"date-parts":[[2016,12,8]]}},"container-title":["2016 IEEE International Conference on Big Data (Big Data)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7818133\/7840573\/07840747.pdf?arnumber=7840747","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2017,12,13]],"date-time":"2017-12-13T20:47:47Z","timestamp":1513198067000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7840747\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,12]]},"references-count":7,"URL":"https:\/\/doi.org\/10.1109\/bigdata.2016.7840747","relation":{},"subject":[],"published":{"date-parts":[[2016,12]]}}}