{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,3]],"date-time":"2026-03-03T08:19:35Z","timestamp":1772525975910,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":39,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,3,4]],"date-time":"2024-03-04T00:00:00Z","timestamp":1709510400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,3,4]]},"DOI":"10.1145\/3616855.3635763","type":"proceedings-article","created":{"date-parts":[[2024,3,4]],"date-time":"2024-03-04T18:18:12Z","timestamp":1709576292000},"page":"529-537","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":5,"title":["A Linguistic Grounding-Infused Contrastive Learning Approach for Health Mention Classification on Social Media"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-0191-7171","authenticated-orcid":false,"given":"Usman","family":"Naseem","sequence":"first","affiliation":[{"name":"School of Computer Science, University of Sydney, Sydney, Australia"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5960-1060","authenticated-orcid":false,"given":"Jinmaan","family":"Kim","sequence":"additional","affiliation":[{"name":"School of Computer Science, University of Sydney, Sydney, Australia"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7792-2327","authenticated-orcid":false,"given":"Matloob","family":"Khush","sequence":"additional","affiliation":[{"name":"Department of Computer Science, Brunel University, London, United Kingdom"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1720-8209","authenticated-orcid":false,"given":"Adam G.","family":"Dunn","sequence":"additional","affiliation":[{"name":"School of Medical Sciences, University of Sydney, Sydney, Australia"}]}],"member":"320","published-online":{"date-parts":[[2024,3,4]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1145\/3543507.3583877"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1145\/3366423.3380198"},{"key":"e_1_3_2_1_3_1","volume-title":"Support-vector networks. Machine learning 20, 3","author":"Cortes Corinna","year":"1995","unstructured":"Corinna Cortes and Vladimir Vapnik. 1995. Support-vector networks. Machine learning 20, 3 (1995), 273--297."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19--1423"},{"key":"e_1_3_2_1_5_1","volume-title":"Self-training improves pre-training for natural language understanding. arXiv preprint arXiv:2010.02194","author":"Du Jingfei","year":"2020","unstructured":"Jingfei Du, Edouard Grave, Beliz Gunel, Vishrav Chaudhary, Onur Celebi, Michael Auli, Ves Stoyanov, and Alexis Conneau. 2020. Self-training improves pre-training for natural language understanding. arXiv preprint arXiv:2010.02194 (2020)."},{"key":"e_1_3_2_1_6_1","volume-title":"Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies. 5408--5418","author":"Du Jingfei","year":"2021","unstructured":"Jingfei Du, \u00c9douard Grave, Beliz Gunel, Vishrav Chaudhary, Onur Celebi, Michael Auli, Veselin Stoyanov, and Alexis Conneau. 2021. Self-training Improves Pretraining for Natural Language Understanding. In Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies. 5408--5418."},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00945"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.552"},{"key":"e_1_3_2_1_9_1","first-page":"2009","article-title":"Twitter sentiment classification using distant supervision. CS224N project report","volume":"1","author":"Go Alec","year":"2009","unstructured":"Alec Go, Richa Bhayani, and Lei Huang. 2009. Twitter sentiment classification using distant supervision. CS224N project report, Stanford 1, 12 (2009), 2009.","journal-title":"Stanford"},{"key":"e_1_3_2_1_10_1","volume-title":"MIP: A method for identifying metaphorically used words in discourse. Metaphor and symbol 22, 1","author":"Pragglejaz Group","year":"2007","unstructured":"Pragglejaz Group. 2007. MIP: A method for identifying metaphorically used words in discourse. Metaphor and symbol 22, 1 (2007), 1--39."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-39964-3_62"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.5555\/2002472.2002541"},{"key":"e_1_3_2_1_14_1","volume-title":"Figurative usage detection of symptom words to improve personal health mention detection. arXiv preprint arXiv:1906.05466","author":"Iyer Adith","year":"2019","unstructured":"Adith Iyer, Aditya Joshi, Sarvnaz Karimi, Ross Sparks, and Cecile Paris. 2019. Figurative usage detection of symptom words to improve personal health mention detection. arXiv preprint arXiv:1906.05466 (2019)."},{"key":"e_1_3_2_1_15_1","volume-title":"Identifying tweets of personal health experience through word embedding and LSTM neural network. BMC bioinformatics 19, 8","author":"Jiang Keyuan","year":"2018","unstructured":"Keyuan Jiang, Shichao Feng, Qunhao Song, Ricardo A Calix, Matrika Gupta, and Gordon R Bernard. 2018. Identifying tweets of personal health experience through word embedding and LSTM neural network. BMC bioinformatics 19, 8 (2018), 210."},{"key":"e_1_3_2_1_16_1","volume-title":"Identifying consumer health terms of side effects in Twitter posts. Studies in health technology and informatics 251","author":"Jiang Keyuan","year":"2018","unstructured":"Keyuan Jiang, CHEN Tingyu, Ricardo A Calix, and Gordon R Bernard. 2018. Identifying consumer health terms of side effects in Twitter posts. Studies in health technology and informatics 251 (2018), 273."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.66"},{"key":"e_1_3_2_1_18_1","volume-title":"Proceedings of the 2018 World Wide Web Conference. 137--146","author":"Karisani Payam","year":"2018","unstructured":"Payam Karisani and Eugene Agichtein. 2018. Did you really just have a heart attack? Towards robust detection of personal health mentions in social media. In Proceedings of the 2018 World Wide Web Conference. 137--146."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1145\/3366423.3380304"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/TCSS.2022.3143768"},{"key":"e_1_3_2_1_21_1","volume-title":"Proceedings of the 2013 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies. 789--795","author":"Lamb Alex","year":"2013","unstructured":"Alex Lamb, Michael Paul, and Mark Dredze. 2013. Separating fact from fear: Tracking flu infections on twitter. In Proceedings of the 2013 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies. 789--795."},{"key":"e_1_3_2_1_22_1","volume-title":"Workshop on challenges in representation learning, ICML","volume":"3","author":"Dong-Hyun","unstructured":"Dong-Hyun Lee et al. 2013. Pseudo-label: The simple and efficient semisupervised learning method for deep neural networks. In Workshop on challenges in representation learning, ICML, Vol. 3. 896."},{"key":"e_1_3_2_1_23_1","volume-title":"Chan Ho So, and Jaewoo Kang","author":"Lee Jinhyuk","year":"2019","unstructured":"Jinhyuk Lee, Wonjin Yoon, Sungdong Kim, Donghyeon Kim, Sunkyu Kim, Chan Ho So, and Jaewoo Kang. 2019. BioBERT: a pre-trained biomedical language representation model for biomedical text mining. arXiv:1901.08746 [cs.CL]"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.emnlp-main.316"},{"key":"e_1_3_2_1_25_1","unstructured":"Yinhan Liu Myle Ott Naman Goyal Jingfei Du Mandar Joshi Danqi Chen Omer Levy Mike Lewis Luke Zettlemoyer and Veselin Stoyanov. 2019. RoBERTa: A Robustly Optimized BERT Pretraining Approach. arXiv:1907.11692 [cs.CL]"},{"key":"e_1_3_2_1_26_1","volume-title":"Supervised Momentum Contrastive Learning for Few-Shot Classification. arXiv preprint arXiv:2101.11058","author":"Majumder Orchid","year":"2021","unstructured":"Orchid Majumder, Avinash Ravichandran, Subhransu Maji, Alessandro Achille, Marzia Polito, and Stefano Soatto. 2021. Supervised Momentum Contrastive Learning for Few-Shot Classification. arXiv preprint arXiv:2101.11058 (2021)."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.5555\/1690219.1690287"},{"key":"e_1_3_2_1_28_1","volume-title":"COVID-TwitterBERT: A Natural Language Processing Model to Analyse COVID-19 Content on Twitter. arXiv preprint arXiv:2005.07503","author":"M\u00fcller Martin","year":"2020","unstructured":"Martin M\u00fcller, Marcel Salath\u00e9, and Per E Kummervold. 2020. COVID-TwitterBERT: A Natural Language Processing Model to Analyse COVID-19 Content on Twitter. arXiv preprint arXiv:2005.07503 (2020)."},{"key":"e_1_3_2_1_29_1","volume-title":"RHMD: a real-world dataset for health mention classification on Reddit","author":"Naseem Usman","year":"2022","unstructured":"Usman Naseem, Matloob Khushi, Jinman Kim, and Adam G Dunn. 2022. RHMD: a real-world dataset for health mention classification on Reddit. IEEE Transactions on Computational Social Systems (2022)."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1145\/3485447.3512129"},{"key":"e_1_3_2_1_31_1","volume-title":"Robust Identification of Figurative Language in Personal Health Mentions on Twitter","author":"Naseem Usman","year":"2022","unstructured":"Usman Naseem, Jinman Kim, Matloob Khushi, and Adam G Dunn. 2022. Robust Identification of Figurative Language in Personal Health Mentions on Twitter. IEEE Transactions on Artificial Intelligence (2022)."},{"key":"e_1_3_2_1_32_1","first-page":"22","article-title":"Benchmarking for Public Health Surveillance tasks on Social Media with a Domain-Specific Pretrained Language Model","volume":"2022","author":"Naseem Usman","year":"2022","unstructured":"Usman Naseem, Byoung Chan Lee, Matloob Khushi, Jinman Kim, and Adam G Dunn. 2022. Benchmarking for Public Health Surveillance tasks on Social Media with a Domain-Specific Pretrained Language Model. NLP-Power 2022 (2022), 22.","journal-title":"NLP-Power"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.1007\/s13278-023-01167-9"},{"key":"e_1_3_2_1_34_1","volume-title":"To tune or not to tune? adapting pretrained representations to diverse tasks. arXiv preprint arXiv:1903.05987","author":"Peters Matthew E","year":"2019","unstructured":"Matthew E Peters, Sebastian Ruder, and Noah A Smith. 2019. To tune or not to tune? adapting pretrained representations to diverse tasks. arXiv preprint arXiv:1903.05987 (2019)."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"crossref","unstructured":"Chuck Rosenberg Martial Hebert and Henry Schneiderman. 2005. Semisupervised self-training of object detection models. (2005).","DOI":"10.1109\/ACVMOT.2005.107"},{"key":"e_1_3_2_1_36_1","volume-title":"A survey of decision tree classifier methodology","author":"Rasoul Safavian S","year":"1991","unstructured":"S Rasoul Safavian and David Landgrebe. 1991. A survey of decision tree classifier methodology. IEEE transactions on systems, man, and cybernetics 21, 3 (1991), 660--674."},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.3115\/v1\/P14-1024"},{"key":"e_1_3_2_1_38_1","first-page":"6256","article-title":"Unsupervised data augmentation for consistency training","volume":"33","author":"Xie Qizhe","year":"2020","unstructured":"Qizhe Xie, Zihang Dai, Eduard Hovy, Thang Luong, and Quoc Le. 2020. Unsupervised data augmentation for consistency training. Advances in Neural Information Processing Systems 33 (2020), 6256--6268.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.naacl-main.84"}],"event":{"name":"WSDM '24: The 17th ACM International Conference on Web Search and Data Mining","location":"Merida Mexico","acronym":"WSDM '24","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","SIGIR ACM Special Interest Group on Information Retrieval"]},"container-title":["Proceedings of the 17th ACM International Conference on Web Search and Data Mining"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3616855.3635763","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3616855.3635763","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T00:51:07Z","timestamp":1755823867000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3616855.3635763"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,3,4]]},"references-count":39,"alternative-id":["10.1145\/3616855.3635763","10.1145\/3616855"],"URL":"https:\/\/doi.org\/10.1145\/3616855.3635763","relation":{},"subject":[],"published":{"date-parts":[[2024,3,4]]},"assertion":[{"value":"2024-03-04","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}