{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,30]],"date-time":"2025-10-30T01:54:33Z","timestamp":1761789273074,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":64,"publisher":"ACM","license":[{"start":{"date-parts":[[2015,9,28]],"date-time":"2015-09-28T00:00:00Z","timestamp":1443398400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2015,9,28]]},"DOI":"10.1145\/2815782.2815789","type":"proceedings-article","created":{"date-parts":[[2015,12,18]],"date-time":"2015-12-18T14:32:43Z","timestamp":1450449163000},"page":"1-10","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":1,"title":["N-Gram Representations For Comment Filtering"],"prefix":"10.1145","author":[{"given":"Dirk","family":"Brand","sequence":"first","affiliation":[{"name":"Computer Science Division, Stellenbosch University"}]},{"given":"Steve","family":"Kroon","sequence":"additional","affiliation":[{"name":"Computer Science Division, Stellenbosch University"}]},{"given":"Brink","family":"van der Merwe","sequence":"additional","affiliation":[{"name":"Computer Science Division, Stellenbosch University"}]},{"given":"Loek","family":"Cleophas","sequence":"additional","affiliation":[{"name":"Dept. of Computing Science, Ume\u00e5 University, Dept. of Information Science, Stellenbosch University"}]}],"member":"320","published-online":{"date-parts":[[2015,9,28]]},"reference":[{"doi-asserted-by":"publisher","key":"e_1_3_2_1_1_1","DOI":"10.1145\/1341531.1341557"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_2_1","DOI":"10.1016\/S0306-4573(02)00021-3"},{"unstructured":"A. U. Alvarez. Bad words list. http:\/\/urbanoalvarez.es\/blog\/2008\/04\/04\/bad-words-list\/. Accessed: March 2014.  A. U. Alvarez. Bad words list. http:\/\/urbanoalvarez.es\/blog\/2008\/04\/04\/bad-words-list\/. Accessed: March 2014.","key":"e_1_3_2_1_3_1"},{"key":"e_1_3_2_1_4_1","first-page":"7","volume-title":"System Sciences, 2003. Proceedings of the 36th Annual Hawaii International Conference on","author":"Basu A.","unstructured":"A. Basu , C. Walters , and M. Shepherd . Support vector machines for text categorization . In System Sciences, 2003. Proceedings of the 36th Annual Hawaii International Conference on , pages 7 --pp. IEEE, 2003. A. Basu, C. Walters, and M. Shepherd. Support vector machines for text categorization. In System Sciences, 2003. Proceedings of the 36th Annual Hawaii International Conference on, pages 7--pp. IEEE, 2003."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_5_1","DOI":"10.5555\/944919.944966"},{"key":"e_1_3_2_1_6_1","first-page":"281","volume":"13","author":"Bergstra J.","year":"2012","unstructured":"J. Bergstra and Y. Bengio . Random Search for Hyper-Parameter Optimization. Journal of Machine Learning Research , 13 : 281 -- 305 , 2012 . J. Bergstra and Y. Bengio. Random Search for Hyper-Parameter Optimization. Journal of Machine Learning Research, 13:281--305, 2012.","journal-title":"Journal of Machine Learning Research"},{"key":"e_1_3_2_1_7_1","volume-title":"Natural language processing with Python","author":"Bird S.","year":"2009","unstructured":"S. Bird , E. Klein , and E. Loper . Natural language processing with Python . O'Reilly Media, Inc. , 2009 . S. Bird, E. Klein, and E. Loper. Natural language processing with Python. O'Reilly Media, Inc., 2009."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_8_1","DOI":"10.5555\/1296233"},{"key":"e_1_3_2_1_9_1","volume-title":"https:\/\/github.com\/DirkBrand\/Comment-Classification","author":"Brand D.","year":"2015","unstructured":"D. Brand . Comment Classification . https:\/\/github.com\/DirkBrand\/Comment-Classification , 2015 . D. Brand. Comment Classification. https:\/\/github.com\/DirkBrand\/Comment-Classification, 2015."},{"key":"e_1_3_2_1_10_1","first-page":"50","volume-title":"Proceedings of the first International Conference on the use of Mobile Informations and Communication Technology (ICT) in Africa","author":"Brand D.","year":"2014","unstructured":"D. Brand and B. van der Merwe. Comment Classification for an Online News Domain . In Proceedings of the first International Conference on the use of Mobile Informations and Communication Technology (ICT) in Africa , pages 50 -- 56 . UMICTA, ACM, 2014 . D. Brand and B. van der Merwe. Comment Classification for an Online News Domain. In Proceedings of the first International Conference on the use of Mobile Informations and Communication Technology (ICT) in Africa, pages 50--56. UMICTA, ACM, 2014."},{"key":"e_1_3_2_1_11_1","volume-title":"Proceedings of the Joint Conference on Empirical Methods in Natural Language Processing and Computational Natural Language Learning. Citeseer","author":"Brants T.","year":"2007","unstructured":"T. Brants , A. C. Popat , P. Xu , F. J. Och , and J. Dean . Large language models in machine translation . In Proceedings of the Joint Conference on Empirical Methods in Natural Language Processing and Computational Natural Language Learning. Citeseer , 2007 . T. Brants, A. C. Popat, P. Xu, F. J. Och, and J. Dean. Large language models in machine translation. In Proceedings of the Joint Conference on Empirical Methods in Natural Language Processing and Computational Natural Language Learning. Citeseer, 2007."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_12_1","DOI":"10.1016\/B978-1-55860-335-6.50012-X"},{"key":"e_1_3_2_1_13_1","volume-title":"Proceedings of SDAIR-94","author":"Cavnar W. B.","year":"1994","unstructured":"W. B. Cavnar and J. M. Trenkle . N-Gram-Based Text Categorization . In Proceedings of SDAIR-94 , 3rd Annual Symposium on Document Analysis and Information Retrieval, pages 161--175 , 1994 . W. B. Cavnar and J. M. Trenkle. N-Gram-Based Text Categorization. In Proceedings of SDAIR-94, 3rd Annual Symposium on Document Analysis and Information Retrieval, pages 161--175, 1994."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_14_1","DOI":"10.1145\/2020408.2020439"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_15_1","DOI":"10.5555\/2283696.2283700"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_16_1","DOI":"10.1075\/ijcl.11.4.04che"},{"key":"e_1_3_2_1_17_1","first-page":"687","volume-title":"Artificial Neural Networks - ICANN","author":"Cherkassky V.","year":"2002","unstructured":"V. Cherkassky and Y. Ma . Selection of meta-parameters for support vector regression . In Artificial Neural Networks - ICANN , pages 687 -- 693 . Springer , 2002 . V. Cherkassky and Y. Ma. Selection of meta-parameters for support vector regression. In Artificial Neural Networks - ICANN, pages 687--693. Springer, 2002."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"crossref","DOI":"10.1017\/CBO9780511801389","volume-title":"An introduction to support vector machines and other kernel-based learning methods","author":"Cristianini N.","year":"2000","unstructured":"N. Cristianini and J. Shawe-Taylor . An introduction to support vector machines and other kernel-based learning methods . Cambridge university Press , 2000 . N. Cristianini and J. Shawe-Taylor. An introduction to support vector machines and other kernel-based learning methods. Cambridge university Press, 2000."},{"unstructured":"H. Daum\u00e9 III. A Course in Machine Learning. http:\/\/ciml.info 2012.  H. Daum\u00e9 III. A Course in Machine Learning. http:\/\/ciml.info 2012.","key":"e_1_3_2_1_19_1"},{"key":"e_1_3_2_1_20_1","volume-title":"N-grams in Texts Categorization","author":"Elberrichi Z.","year":"2007","unstructured":"Z. Elberrichi and B. Aljohar . N-grams in Texts Categorization . Scientific Journal of King Faisal University (Basic and Applied Sciences) , 8(2):25--39, 2007 . Z. Elberrichi and B. Aljohar. N-grams in Texts Categorization. Scientific Journal of King Faisal University (Basic and Applied Sciences), 8(2):25--39, 2007."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_21_1","DOI":"10.1037\/h0057532"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_22_1","DOI":"10.5555\/3120676.3120728"},{"key":"e_1_3_2_1_23_1","volume-title":"ISIS technical report, 14","author":"Gunn S. R.","year":"1998","unstructured":"S. R. Gunn . Support Vector Machines for Classification and Regression. ISIS technical report, 14 , 1998 . S. R. Gunn. Support Vector Machines for Classification and Regression. ISIS technical report, 14, 1998."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_24_1","DOI":"10.1007\/s00500-005-0503-y"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_25_1","DOI":"10.5555\/944919.944968"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_26_1","DOI":"10.1109\/TIT.2002.805090"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_27_1","DOI":"10.1007\/978-3-540-85845-4_9"},{"key":"e_1_3_2_1_28_1","volume-title":"Learning multiple layers of representation. Trends in cognitive sciences, 11(10):428--434","author":"Hinton G. E.","year":"2007","unstructured":"G. E. Hinton . Learning multiple layers of representation. Trends in cognitive sciences, 11(10):428--434 , 2007 . G. E. Hinton. Learning multiple layers of representation. Trends in cognitive sciences, 11(10):428--434, 2007."},{"key":"e_1_3_2_1_29_1","volume-title":"IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings","volume":"4","author":"Hirsim\u00e4ki T.","year":"2007","unstructured":"T. Hirsim\u00e4ki . On compressing N-gram language models. In ICASSP , IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings , volume 4 , 2007 . T. Hirsim\u00e4ki. On compressing N-gram language models. In ICASSP, IEEE International Conference on Acoustics, Speech and Signal Processing - Proceedings, volume 4, 2007."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_30_1","DOI":"10.1109\/CSE.2009.109"},{"issue":"1","key":"e_1_3_2_1_31_1","first-page":"1396","article-title":"A Practical Guide to Support Vector Classification","volume":"101","author":"Hsu C. W.","year":"2008","unstructured":"C. W. Hsu , C. C. Chang , and C. J. Lin . A Practical Guide to Support Vector Classification . BJU international , 101 ( 1 ): 1396 -- 1400 , 2008 . C. W. Hsu, C. C. Chang, and C. J. Lin. A Practical Guide to Support Vector Classification. BJU international, 101(1):1396--400, 2008.","journal-title":"BJU international"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_32_1","DOI":"10.5555\/645326.649721"},{"key":"e_1_3_2_1_33_1","volume-title":"SciPy: Open source scientific tools for Python","author":"Jones E.","year":"2014","unstructured":"E. Jones , T. Oliphant , and P. Peterson . SciPy: Open source scientific tools for Python , 2014 . E. Jones, T. Oliphant, and P. Peterson. SciPy: Open source scientific tools for Python, 2014."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_34_1","DOI":"10.1145\/345966.345982"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_35_1","DOI":"10.1145\/985692.985761"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_36_1","DOI":"10.1162\/153244302760200687"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_37_1","DOI":"10.4324\/9780203137802"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_38_1","DOI":"10.1147\/rd.22.0159"},{"key":"e_1_3_2_1_39_1","first-page":"1","volume-title":"Proceedings of the International Conference on Learning Representations (ICLR 2013","author":"Mikolov T.","year":"2013","unstructured":"T. Mikolov , G. Corrado , K. Chen , and J. Dean . Efficient Estimation of Word Representations in Vector Space . Proceedings of the International Conference on Learning Representations (ICLR 2013 ), pages 1 -- 12 , 2013 . T. Mikolov, G. Corrado, K. Chen, and J. Dean. Efficient Estimation of Word Representations in Vector Space. Proceedings of the International Conference on Learning Representations (ICLR 2013), pages 1--12, 2013."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_40_1","DOI":"10.1145\/219717.219748"},{"key":"e_1_3_2_1_41_1","first-page":"19","volume-title":"Proceedings of ACM SIGIR 2005 Workshop on Stylistic Analysis of Text for Information Access","author":"Mishne G.","year":"2005","unstructured":"G. Mishne . Experiments with mood classification in blog posts . Proceedings of ACM SIGIR 2005 Workshop on Stylistic Analysis of Text for Information Access , page 19 , 2005 . G. Mishne. Experiments with mood classification in blog posts. Proceedings of ACM SIGIR 2005 Workshop on Stylistic Analysis of Text for Information Access, page 19, 2005."},{"key":"e_1_3_2_1_42_1","first-page":"1081","volume-title":"Advances in neural information processing systems","author":"Mnih A.","year":"2009","unstructured":"A. Mnih and G. E. Hinton . A scalable hierarchical distributed language model . In Advances in neural information processing systems , pages 1081 -- 1088 , 2009 . A. Mnih and G. E. Hinton. A scalable hierarchical distributed language model. In Advances in neural information processing systems, pages 1081--1088, 2009."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_43_1","DOI":"10.1016\/j.knosys.2009.11.004"},{"key":"e_1_3_2_1_44_1","volume-title":"The PageRank citation ranking: Bringing order to the web","author":"Page L.","year":"1999","unstructured":"L. Page , S. Brin , R. Motwani , and T. Winograd . The PageRank citation ranking: Bringing order to the web . 1999 . L. Page, S. Brin, R. Motwani, and T. Winograd. The PageRank citation ranking: Bringing order to the web. 1999."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_45_1","DOI":"10.5555\/1953048.2078195"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_46_1","DOI":"10.1145\/1367497.1367510"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_47_1","DOI":"10.1002\/(SICI)1097-4571(198609)37:5<279::AID-ASI1>3.0.CO;2-Q"},{"unstructured":"Ranks.nl. Default english stopwords list. http:\/\/www.ranks.nl\/stopwords. Accessed: July 2014.  Ranks.nl. Default english stopwords list. http:\/\/www.ranks.nl\/stopwords. Accessed: July 2014.","key":"e_1_3_2_1_48_1"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"crossref","first-page":"405","DOI":"10.1007\/978-3-642-21064-8_28","volume-title":"The Semanic Web: Research and Applications","author":"Rowe M.","year":"2011","unstructured":"M. Rowe , S. Angeletou , and H. Alani . Predicting discussions on the social semantic web . In The Semanic Web: Research and Applications , pages 405 -- 420 . Springer , 2011 . M. Rowe, S. Angeletou, and H. Alani. Predicting discussions on the social semantic web. In The Semanic Web: Research and Applications, pages 405--420. Springer, 2011."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_50_1","DOI":"10.1145\/544741.544854"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_51_1","DOI":"10.1016\/0306-4573(88)90021-0"},{"key":"e_1_3_2_1_52_1","volume-title":"Introduction to Modern Information Retrieval","author":"Salton G.","year":"1986","unstructured":"G. Salton and M. J. McGill . Introduction to Modern Information Retrieval . McGraw-Hill, Inc. , 1986 . G. Salton and M. J. McGill. Introduction to Modern Information Retrieval. McGraw-Hill, Inc., 1986."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_53_1","DOI":"10.1145\/361219.361220"},{"unstructured":"N. Shuyo. Language Detection Library for Java 2010.  N. Shuyo. Language Detection Library for Java 2010.","key":"e_1_3_2_1_54_1"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_55_1","DOI":"10.1007\/978-3-642-37798-3_1"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_56_1","DOI":"10.4304\/jmm.9.5.635-643"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_57_1","DOI":"10.1145\/1835449.1835643"},{"key":"e_1_3_2_1_58_1","volume-title":"Feature Selection for Classification: A Review. Data Classification: Algorithms and Applications, page 37","author":"Tang J.","year":"2014","unstructured":"J. Tang , S. Alelyani , and H. Liu . Feature Selection for Classification: A Review. Data Classification: Algorithms and Applications, page 37 , 2014 . J. Tang, S. Alelyani, and H. Liu. Feature Selection for Classification: A Review. Data Classification: Algorithms and Applications, page 37, 2014."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_59_1","DOI":"10.1016\/j.cmpb.2005.11.007"},{"unstructured":"Tryolabs. Reddit's new comment sorting system. http:\/\/www.tryolabs.com\/. Accessed: February 2014.  Tryolabs. Reddit's new comment sorting system. http:\/\/www.tryolabs.com\/. Accessed: February 2014.","key":"e_1_3_2_1_60_1"},{"key":"e_1_3_2_1_61_1","first-page":"1","article-title":"A Comparative Review","volume":"10","author":"van der Maaten L.","year":"2009","unstructured":"L. van der Maaten , E. Postma , and J. van den Herik . Dimensionality Reduction : A Comparative Review . Journal of Machine Learning Research , 10 : 1 -- 41 , 2009 . L. van der Maaten, E. Postma, and J. van den Herik. Dimensionality Reduction: A Comparative Review. Journal of Machine Learning Research, 10:1--41, 2009.","journal-title":"Journal of Machine Learning Research"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_62_1","DOI":"10.5555\/211359"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_63_1","DOI":"10.1145\/1458527.1458534"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_64_1","DOI":"10.5555\/1557769.1557806"}],"event":{"acronym":"SAICSIT '15","name":"SAICSIT '15: The 2015 Annual Research Conference of the South African Institute of Computer Scientists and Information Technologists","location":"Stellenbosch South Africa"},"container-title":["Proceedings of the 2015 Annual Research Conference on South African Institute of Computer Scientists and Information Technologists"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2815782.2815789","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/2815782.2815789","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T05:48:22Z","timestamp":1750225702000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/2815782.2815789"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2015,9,28]]},"references-count":64,"alternative-id":["10.1145\/2815782.2815789","10.1145\/2815782"],"URL":"https:\/\/doi.org\/10.1145\/2815782.2815789","relation":{},"subject":[],"published":{"date-parts":[[2015,9,28]]},"assertion":[{"value":"2015-09-28","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}