{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,2]],"date-time":"2026-01-02T07:49:21Z","timestamp":1767340161861,"version":"build-2065373602"},"publisher-location":"Republic and Canton of Geneva, Switzerland","reference-count":47,"publisher":"International World Wide Web Conferences Steering Committee","license":[{"start":{"date-parts":[[2015,5,18]],"date-time":"2015-05-18T00:00:00Z","timestamp":1431907200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2015,5,18]]},"DOI":"10.1145\/2736277.2741628","type":"proceedings-article","created":{"date-parts":[[2016,2,5]],"date-time":"2016-02-05T20:37:12Z","timestamp":1454704632000},"page":"960-970","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":22,"title":["N-gram IDF"],"prefix":"10.1145","author":[{"given":"Masumi","family":"Shirakawa","sequence":"first","affiliation":[{"name":"Osaka University, Osaka, Japan"}]},{"given":"Takahiro","family":"Hara","sequence":"additional","affiliation":[{"name":"Osaka University, Osaka, Japan"}]},{"given":"Shojiro","family":"Nishio","sequence":"additional","affiliation":[{"name":"Osaka University, Osaka, Japan"}]}],"member":"320","published-online":{"date-parts":[[2015,5,18]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1016\/S1570-8667(03)00065-0"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1016\/S0306-4573(02)00021-3"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/18.681318"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/28869.28873"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1002\/asi.4630250505"},{"key":"e_1_3_2_1_6_1","first-page":"31","volume-title":"Normalized (Pointwise) Mutual Information in Collocation Extraction. In Proceedings of International Conference of the German Society for Computational Linguistics and Language Technology (GSCL)","author":"Bouma G.","year":"2009","unstructured":"G. Bouma . Normalized (Pointwise) Mutual Information in Collocation Extraction. In Proceedings of International Conference of the German Society for Computational Linguistics and Language Technology (GSCL) , pages 31 -- 40 , Sep.\/ Oct. 2009 . G. Bouma. Normalized (Pointwise) Mutual Information in Collocation Extraction. In Proceedings of International Conference of the German Society for Computational Linguistics and Language Technology (GSCL), pages 31--40, Sep.\/Oct. 2009."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.5555\/1873781.1873795"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1017\/S1351324900000139"},{"key":"e_1_3_2_1_9_1","doi-asserted-by":"publisher","DOI":"10.5555\/89086.89095"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/TIT.2005.844059"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2007.48"},{"key":"e_1_3_2_1_12_1","first-page":"369","volume-title":"Proceedings of Meeting on Mathematics of Language (MOL)","author":"da Silva J. F.","year":"1999","unstructured":"J. F. da Silva and J. G. P. Lopes . A Local Maxima Method and a Fair Dispersion Normalization for Extracting Multi-word Units from Corpora . In Proceedings of Meeting on Mathematics of Language (MOL) , pages 369 -- 381 , July 1999 . J. F. da Silva and J. G. P. Lopes. A Local Maxima Method and a Fair Dispersion Normalization for Extracting Multi-word Units from Corpora. In Proceedings of Meeting on Mathematics of Language (MOL), pages 369--381, July 1999."},{"key":"e_1_3_2_1_13_1","first-page":"20","volume-title":"Proceedings of ACM SIGKDD Workshop on Text Mining","author":"Dias G.","year":"2000","unstructured":"G. Dias . Mining Textual Associations in Text Corpora . In Proceedings of ACM SIGKDD Workshop on Text Mining , pages 20 -- 23 , Aug. 2000 . G. Dias. Mining Textual Associations in Text Corpora. In Proceedings of ACM SIGKDD Workshop on Text Mining, pages 20--23, Aug. 2000."},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611972733.6"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.tcs.2011.12.002"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"publisher","DOI":"10.1145\/290941.290948"},{"key":"e_1_3_2_1_17_1","first-page":"841","volume-title":"Proceedings of ACM-SIAM Symposium on Discrete Algorithms (SODA)","author":"Grossi R.","year":"2003","unstructured":"R. Grossi , A. Gupta , and J. S. Vitter . High-Order Entropy-Compressed Text Indexes . In Proceedings of ACM-SIAM Symposium on Discrete Algorithms (SODA) , pages 841 -- 850 , 2003 . R. Grossi, A. Gupta, and J. S. Vitter. High-Order Entropy-Compressed Text Indexes. In Proceedings of ACM-SIAM Symposium on Discrete Algorithms (SODA), pages 841--850, 2003."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1002\/asi.4630260402"},{"key":"e_1_3_2_1_19_1","first-page":"365","volume-title":"Proceedings of International Conference on Computational Linguistics (COLING)","author":"Hasan K. S.","year":"2010","unstructured":"K. S. Hasan and V. Ng . Conundrums in Unsupervised Keyphrase Extraction: Making Sense of the State-of-the-Art . In Proceedings of International Conference on Computational Linguistics (COLING) , pages 365 -- 373 , Aug. 2010 . K. S. Hasan and V. Ng. Conundrums in Unsupervised Keyphrase Extraction: Making Sense of the State-of-the-Art. In Proceedings of International Conference on Computational Linguistics (COLING), pages 365--373, Aug. 2010."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1007\/s007999900025"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1108\/eb026526"},{"key":"e_1_3_2_1_22_1","volume-title":"On Tables of Random Numbers. Sankhy\\=a Ser. A, 25: 369--376","author":"Kolmogorov A.","year":"1963","unstructured":"A. Kolmogorov . On Tables of Random Numbers. Sankhy\\=a Ser. A, 25: 369--376 , 1963 . A. Kolmogorov. On Tables of Random Numbers. Sankhy\\=a Ser. A, 25:369--376, 1963."},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2008.110"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1147\/rd.53.0183"},{"key":"e_1_3_2_1_25_1","volume-title":"An Introduction to Kolmogorov Complexity and Its Applications","author":"Li M.","year":"2009","unstructured":"M. Li and P. M. Vit\u00e1nyi . An Introduction to Kolmogorov Complexity and Its Applications . Springer , Berlin , 3 rd edition, 2009 . M. Li and P. M. Vit\u00e1nyi. An Introduction to Kolmogorov Complexity and Its Applications. Springer, Berlin, 3rd edition, 2009.","edition":"3"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.5555\/1394399"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/1458082.1458137"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/1963192.1963239"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.5555\/2394373.2394418"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1137\/1.9781611972795.72"},{"key":"e_1_3_2_1_31_1","first-page":"1037","volume-title":"Proceedings of International Conference on Language Resources and Evaluation (LREC)","author":"C.","year":"2004","unstructured":"C. Or\\uasan, V. Pekar , and L. Hasler . A Comparison of Summarisation Methods Based on Term Specificity Estimation . In Proceedings of International Conference on Language Resources and Evaluation (LREC) , pages 1037 -- 1041 , May 2004 . C. Or\\uasan, V. Pekar, and L. Hasler. A Comparison of Summarisation Methods Based on Term Specificity Estimation. In Proceedings of International Conference on Language Resources and Evaluation (LREC), pages 1037--1041, May 2004."},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.3115\/1073336.1073340"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"crossref","first-page":"13","DOI":"10.3115\/1628960.1628964","volume-title":"Proceedings of ACL Student Research Workshop","author":"Pecina P.","year":"2005","unstructured":"P. Pecina . An Extensive Empirical Study of Collocation Extraction Methods . In Proceedings of ACL Student Research Workshop , pages 13 -- 18 , June 2005 . P. Pecina. An Extensive Empirical Study of Collocation Extraction Methods. In Proceedings of ACL Student Research Workshop, pages 13--18, June 2005."},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA.2006.50"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/1076034.1076095"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1108\/00220410410560582"},{"key":"e_1_3_2_1_37_1","first-page":"109","volume-title":"Proceedings of Text Retrieval Conference (TREC)","author":"Robertson S.","year":"1994","unstructured":"S. Robertson , S. Walker , S. Jones , M. Hancock-Beaulieu , and M. Gatford . Okapi at TREC-3 . In Proceedings of Text Retrieval Conference (TREC) , pages 109 -- 126 , 1994 . S. Robertson, S. Walker, S. Jones, M. Hancock-Beaulieu, and M. Gatford. Okapi at TREC-3. In Proceedings of Text Retrieval Conference (TREC), pages 109--126, 1994."},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1145\/1390334.1390409"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/2505515.2505671"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1145\/2348283.2348401"},{"key":"e_1_3_2_1_41_1","volume-title":"Introduction to Modern Information Retrieval","author":"Salton G.","year":"1983","unstructured":"G. Salton and M. J. McGill . Introduction to Modern Information Retrieval . McGraw-Hill , New York , 1983 . G. Salton and M. J. McGill. Introduction to Modern Information Retrieval. McGraw-Hill, New York, 1983."},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/361219.361220"},{"key":"e_1_3_2_1_43_1","first-page":"100","volume-title":"Proceedings of Conference on Empirical Methods in Natural Language Processing (EMNLP)","author":"Schone P.","year":"2001","unstructured":"P. Schone and D. Jurafsky . Is Knowledge-Free Induction of Multiword Unit Dictionary Headwords a Solved Problem ? In Proceedings of Conference on Empirical Methods in Natural Language Processing (EMNLP) , pages 100 -- 108 , June 2001 . P. Schone and D. Jurafsky. Is Knowledge-Free Induction of Multiword Unit Dictionary Headwords a Solved Problem? In Proceedings of Conference on Empirical Methods in Natural Language Processing (EMNLP), pages 100--108, June 2001."},{"key":"e_1_3_2_1_44_1","doi-asserted-by":"publisher","DOI":"10.5555\/946247.946751"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1145\/1361684.1361686"},{"key":"e_1_3_2_1_47_1","doi-asserted-by":"publisher","DOI":"10.1162\/089120101300346787"},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2009.02.026"}],"event":{"name":"WWW '15: 24th International World Wide Web Conference","sponsor":["IW3C2 International World Wide Web Conference Committee","SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web"],"location":"Florence Italy","acronym":"WWW '15"},"container-title":["Proceedings of the 24th International Conference on World Wide Web"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2736277.2741628","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2736277.2741628","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T06:12:29Z","timestamp":1750227149000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2736277.2741628"}},"subtitle":["A Global Term Weighting Scheme Based on Information Distance"],"short-title":[],"issued":{"date-parts":[[2015,5,18]]},"references-count":47,"alternative-id":["10.1145\/2736277.2741628","10.5555\/2736277"],"URL":"https:\/\/doi.org\/10.1145\/2736277.2741628","relation":{},"subject":[],"published":{"date-parts":[[2015,5,18]]},"assertion":[{"value":"2015-05-18","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}