{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,2]],"date-time":"2025-08-02T05:00:02Z","timestamp":1754110802219},"publisher-location":"New York, NY, USA","reference-count":19,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2005,3,13]]},"DOI":"10.1145\/1066677.1066917","type":"proceedings-article","created":{"date-parts":[[2005,8,3]],"date-time":"2005-08-03T08:31:47Z","timestamp":1123057907000},"page":"1049-1053","update-policy":"http:\/\/dx.doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":16,"title":["Rule-based word clustering for document metadata extraction"],"prefix":"10.1145","author":[{"given":"Hui","family":"Han","sequence":"first","affiliation":[{"name":"Yahoo Inc., Sunnyvale, CA"}]},{"given":"Eren","family":"Manavoglu","sequence":"additional","affiliation":[{"name":"The Pennsylvania State University, PA"}]},{"given":"Hongyuan","family":"Zha","sequence":"additional","affiliation":[{"name":"The Pennsylvania State University, PA"}]},{"given":"Kostas","family":"Tsioutsiouliklis","sequence":"additional","affiliation":[{"name":"Yahoo Inc., Sunnyvale, CA"}]},{"given":"C. Lee","family":"Giles","sequence":"additional","affiliation":[{"name":"The Pennsylvania State University, PA"}]},{"given":"Xiangmin","family":"Zhang","sequence":"additional","affiliation":[{"name":"Rutgers University, New Brunswick, NJ"}]}],"member":"320","published-online":{"date-parts":[[2005,3,13]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/290941.290970"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.3115\/974557.974586"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1145\/775152.775226"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1002\/(SICI)1097-4571(199009)41:6<391::AID-ASI1>3.0.CO;2-9"},{"key":"e_1_3_2_1_5_1","volume-title":"Machine Learning Research(JMLR)","author":"Dhillon I.","year":"2002","unstructured":"I. Dhillon , S. Manella , and R. Kumar . A divisive information-theoretic feature clustering for text classification . Machine Learning Research(JMLR) , 2002 . I. Dhillon, S. Manella, and R. Kumar. A divisive information-theoretic feature clustering for text classification. Machine Learning Research(JMLR), 2002."},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.5555\/516965.829161"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.5555\/827140.827146"},{"key":"e_1_3_2_1_8_1","volume-title":"Proceedings of Uncertainty in Artificial Intelligence","author":"Hofmann T.","year":"1999","unstructured":"T. Hofmann . Probabilistic latent semantic analysis . In Proceedings of Uncertainty in Artificial Intelligence , 1999 . T. Hofmann. Probabilistic latent semantic analysis. In Proceedings of Uncertainty in Artificial Intelligence, 1999."},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.1145\/564376.564412"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1023\/A:1009953814988"},{"key":"e_1_3_2_1_11_1","first-page":"305","volume-title":"Proceedings of the 5th International Joint Conference on Artificial Intelligence","author":"Mitchell T.","year":"1977","unstructured":"T. Mitchell . Version spaces : A candidate elimination approach to rule learning . In Proceedings of the 5th International Joint Conference on Artificial Intelligence , pages 305 -- 310 , 1977 . T. Mitchell. Version spaces: A candidate elimination approach to rule learning. In Proceedings of the 5th International Joint Conference on Artificial Intelligence, pages 305--310, 1977."},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.3115\/981574.981598"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/5.18626"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.3115\/1073336.1073360"},{"key":"e_1_3_2_1_15_1","volume-title":"Proceedings of AAAI 99 Workshop on Machine Learning for Information Extraction","author":"Seymore K.","year":"1999","unstructured":"K. Seymore , A. McCallum , and R. Rosenfeld . Learning hidden Markov model structure for information extraction . In Proceedings of AAAI 99 Workshop on Machine Learning for Information Extraction , 1999 . K. Seymore, A. McCallum, and R. Rosenfeld. Learning hidden Markov model structure for information extraction. In Proceedings of AAAI 99 Workshop on Machine Learning for Information Extraction, 1999."},{"key":"e_1_3_2_1_16_1","volume-title":"Proceedings of the 23rd European Colloquium on Information Retrieval Research","author":"Slonim N.","year":"2001","unstructured":"N. Slonim and N. Tishby . The power of word clusters for text classification . In Proceedings of the 23rd European Colloquium on Information Retrieval Research , 2001 . N. Slonim and N. Tishby. The power of word clusters for text classification. In Proceedings of the 23rd European Colloquium on Information Retrieval Research, 2001."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.5555\/827140.827147"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.5555\/211359"},{"key":"e_1_3_2_1_19_1","first-page":"412","volume-title":"Proceedings of the 14th International Conference on Machine Learning","author":"Yang Y.","year":"1997","unstructured":"Y. Yang and J. O. Pedersen . A comparative study on feature selection in text categorization . In Proceedings of the 14th International Conference on Machine Learning , pages 412 -- 420 , 1997 . Y. Yang and J. O. Pedersen. A comparative study on feature selection in text categorization. In Proceedings of the 14th International Conference on Machine Learning, pages 412--420, 1997."}],"event":{"name":"SAC05: The 2005 ACM Symposium on Applied Computing","sponsor":["SIGAPP ACM Special Interest Group on Applied Computing"],"location":"Santa Fe New Mexico","acronym":"SAC05"},"container-title":["Proceedings of the 2005 ACM symposium on Applied computing"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/1066677.1066917","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,7]],"date-time":"2023-01-07T19:29:37Z","timestamp":1673119777000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/1066677.1066917"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2005,3,13]]},"references-count":19,"alternative-id":["10.1145\/1066677.1066917","10.1145\/1066677"],"URL":"https:\/\/doi.org\/10.1145\/1066677.1066917","relation":{},"subject":[],"published":{"date-parts":[[2005,3,13]]},"assertion":[{"value":"2005-03-13","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}