{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,21]],"date-time":"2025-11-21T12:02:24Z","timestamp":1763726544707,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":29,"publisher":"ACM","license":[{"start":{"date-parts":[[2011,10,24]],"date-time":"2011-10-24T00:00:00Z","timestamp":1319414400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2011,10,24]]},"DOI":"10.1145\/2063576.2063636","type":"proceedings-article","created":{"date-parts":[[2011,11,16]],"date-time":"2011-11-16T10:40:21Z","timestamp":1321440021000},"page":"383-392","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":35,"title":["Legal document clustering with built-in topic segmentation"],"prefix":"10.1145","author":[{"given":"Qiang","family":"Lu","sequence":"first","affiliation":[{"name":"Thomson Reuters, Rochester, NY, USA"}]},{"given":"Jack G.","family":"Conrad","sequence":"additional","affiliation":[{"name":"Thomson Reuters, Saint Paul, MN, USA"}]},{"given":"Khalid","family":"Al-Kofahi","sequence":"additional","affiliation":[{"name":"Thomson Reuters, Saint Paul, MN, USA"}]},{"given":"William","family":"Keenan","sequence":"additional","affiliation":[{"name":"Thomson Reuters, Rochester, NY, USA"}]}],"member":"320","published-online":{"date-parts":[[2011,10,24]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/502585.502603"},{"key":"e_1_3_2_1_2_1","volume-title":"Proceedings of the DARPA Broadcast News Transcription and understanding Workshop","author":"Allen J.","year":"1998","unstructured":"J. Allen and et al. Topic detection and tracking pilot study -- final report . In Proceedings of the DARPA Broadcast News Transcription and understanding Workshop , 1998 . J. Allen and et al. Topic detection and tracking pilot study -- final report. In Proceedings of the DARPA Broadcast News Transcription and understanding Workshop, 1998."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.3115\/976909.979665"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1007\/3-540-28349-8_2"},{"key":"e_1_3_2_1_5_1","first-page":"993","article-title":"Latent dirichlet allocation","volume":"3","author":"Blei D.","year":"2002","unstructured":"D. Blei , A. Ng , and M. Jordan . Latent dirichlet allocation . Journal of Machine Learning Research , 3 : 993 -- 1022 , 2002 . D. Blei, A. Ng, and M. Jordan. Latent dirichlet allocation. Journal of Machine Learning Research, 3:993--1022, 2002.","journal-title":"Journal of Machine Learning Research"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2000.906021"},{"key":"e_1_3_2_1_7_1","first-page":"26","volume-title":"Proceedings of the Association for Computational Linguistics","author":"Choi F.","year":"2000","unstructured":"F. Choi . Advances in domain independent linear text segmentation . In Proceedings of the Association for Computational Linguistics , pages 26 -- 33 , 2000 . F. Choi. Advances in domain independent linear text segmentation. In Proceedings of the Association for Computational Linguistics, pages 26--33, 2000."},{"key":"e_1_3_2_1_8_1","first-page":"109","volume-title":"Proceedings of EMNLP","author":"Choi F.","year":"2001","unstructured":"F. Choi , P. Wiemer-Hastings , and J. Moore . Latent semantic analysis for text segmentation . In Proceedings of EMNLP , pages 109 -- 117 , 2001 . F. Choi, P. Wiemer-Hastings, and J. Moore. Latent semantic analysis for text segmentation. In Proceedings of EMNLP, pages 109--117, 2001."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/1165485.1165513"},{"key":"e_1_3_2_1_10_1","volume-title":"Proceedings of the Sixth Symposium on Operating System Design and Implementation (OSDI04)","author":"Dean J.","year":"2004","unstructured":"J. Dean and S. Ghemawat . Mapreduce: Simplified data processing on large clusters . In Proceedings of the Sixth Symposium on Operating System Design and Implementation (OSDI04) , 2004 . J. Dean and S. Ghemawat. Mapreduce: Simplified data processing on large clusters. In Proceedings of the Sixth Symposium on Operating System Design and Implementation (OSDI04), 2004."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9"},{"volume-title":"http:\/\/hadoop.apache.org\/","year":"2010","key":"e_1_3_2_1_12_1","unstructured":"Apache hadoop. http:\/\/hadoop.apache.org\/ , 2010 . Apache hadoop. http:\/\/hadoop.apache.org\/, 2010."},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.5555\/972684.972687"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1145\/312624.312649"},{"key":"e_1_3_2_1_15_1","first-page":"225","volume-title":"Proceedings of the IEEE International Conference on Data Mining","author":"Hung M.C.","year":"2001","unstructured":"M.C. Hung and D.L. Yang . An efficient fuzzy c-means clustering algorithm . In Proceedings of the IEEE International Conference on Data Mining , pages 225 -- 232 , 2001 . M.C. Hung and D.L. Yang. An efficient fuzzy c-means clustering algorithm. In Proceedings of the IEEE International Conference on Data Mining, pages 225--232, 2001."},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2002.1007544"},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.3115\/981574.981616"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.3115\/976744.976772"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.5555\/1855013"},{"volume-title":"http:\/\/lucene.apache.org\/mahout\/","year":"2010","key":"e_1_3_2_1_20_1","unstructured":"Apache mahout overview. http:\/\/lucene.apache.org\/mahout\/ , 2010 . Apache mahout overview. http:\/\/lucene.apache.org\/mahout\/, 2010."},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/347090.347123"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.5555\/522936.790146"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/584792.584889"},{"key":"e_1_3_2_1_24_1","series-title":"Lecture Notes in Computer Science, 5032","volume-title":"A statistical model for topic segmentation and clustering","author":"Shafiei M.","year":"2008","unstructured":"M. Shafiei and E. Milios . A statistical model for topic segmentation and clustering . Lecture Notes in Computer Science, 5032 , 2008 . M. Shafiei and E. Milios. A statistical model for topic segmentation and clustering. Lecture Notes in Computer Science, 5032, 2008."},{"volume-title":"http:\/\/svmlight.joachims.org\/","year":"2010","key":"e_1_3_2_1_25_1","unstructured":"Svm light. http:\/\/svmlight.joachims.org\/ , 2010 . Svm light. http:\/\/svmlight.joachims.org\/, 2010."},{"key":"e_1_3_2_1_26_1","volume-title":"Proceedings of the Text Mining Workshop, SIAM Data Mining Conference","author":"Tagarelli A.","year":"2008","unstructured":"A. Tagarelli and G. Karypis . A segment-based approach to clustering multi-topic documents . In Proceedings of the Text Mining Workshop, SIAM Data Mining Conference , 2008 . A. Tagarelli and G. Karypis. A segment-based approach to clustering multi-topic documents. In Proceedings of the Text Mining Workshop, SIAM Data Mining Conference, 2008."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.3115\/1073012.1073076"},{"key":"e_1_3_2_1_28_1","volume-title":"Automated clustering and extraction of distinctive words in legal documents. Dept. of computer science and engineering report","author":"Vaughn N.","year":"2001","unstructured":"N. Vaughn and D. Boley . Automated clustering and extraction of distinctive words in legal documents. Dept. of computer science and engineering report , University of Minnesota , 2001 . N. Vaughn and D. Boley. Automated clustering and extraction of distinctive words in legal documents. Dept. of computer science and engineering report, University of Minnesota, 2001."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/290941.290956"}],"event":{"name":"CIKM '11: International Conference on Information and Knowledge Management","sponsor":["SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGIR ACM Special Interest Group on Information Retrieval"],"location":"Glasgow Scotland, UK","acronym":"CIKM '11"},"container-title":["Proceedings of the 20th ACM international conference on Information and knowledge management"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2063576.2063636","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2063576.2063636","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T09:54:11Z","timestamp":1750240451000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2063576.2063636"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2011,10,24]]},"references-count":29,"alternative-id":["10.1145\/2063576.2063636","10.1145\/2063576"],"URL":"https:\/\/doi.org\/10.1145\/2063576.2063636","relation":{},"subject":[],"published":{"date-parts":[[2011,10,24]]},"assertion":[{"value":"2011-10-24","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}