{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,14]],"date-time":"2025-06-14T19:10:09Z","timestamp":1749928209828,"version":"3.41.0"},"publisher-location":"Singapore","reference-count":42,"publisher":"Springer Nature Singapore","isbn-type":[{"value":"9789819681693","type":"print"},{"value":"9789819681709","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-981-96-8170-9_36","type":"book-chapter","created":{"date-parts":[[2025,6,14]],"date-time":"2025-06-14T18:50:39Z","timestamp":1749927039000},"page":"461-477","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Modeling Data Diversity for\u00a0Joint Instance and\u00a0Verbalizer Selection in\u00a0Cold-Start Scenarios"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-3112-7445","authenticated-orcid":false,"given":"Mohna","family":"Chakraborty","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4625-4212","authenticated-orcid":false,"given":"Adithya","family":"Kulkarni","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3136-2157","authenticated-orcid":false,"given":"Qi","family":"Li","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,6,15]]},"reference":[{"key":"36_CR1","unstructured":"Achiam, J., et\u00a0al.: Gpt-4 technical report. arXiv preprint arXiv:2303.08774 (2023)"},{"key":"36_CR2","doi-asserted-by":"publisher","unstructured":"Chakraborty, M., Kulkarni, A., Li, Q.: Open-domain aspect-opinion co-mining with double-layer span extraction. In: Proceedings of the 28th ACM SIGKDD Conference on Knowledge Discovery and Data Mining, KDD \u201922, pp. 66\u201375. Association for Computing Machinery, New York (2022). https:\/\/doi.org\/10.1145\/3534678.3539386","DOI":"10.1145\/3534678.3539386"},{"key":"36_CR3","doi-asserted-by":"crossref","unstructured":"Chakraborty, M., Kulkarni, A., Li, Q.: Zero-shot approach to overcome perturbation sensitivity of prompts. In: Proceedings of the 61st Annual Meeting of the Association for Computational Linguistics, vol. 1: Long Papers, pp. 5698\u20135711 (2023)","DOI":"10.18653\/v1\/2023.acl-long.313"},{"key":"36_CR4","doi-asserted-by":"crossref","unstructured":"Chang, E., Shen, X., Yeh, H.S., Demberg, V.: On training instance selection for few-shot neural text generation. In: Proceedings of the 59th Annual Meeting of the ACL and the 11th IJCNLP, vol. 2: Short Papers, pp. 8\u201313 (2021)","DOI":"10.18653\/v1\/2021.acl-short.2"},{"key":"36_CR5","doi-asserted-by":"crossref","unstructured":"Cui, G., Hu, S., Ding, N., Huang, L., Liu, Z.: Prototypical verbalizer for prompt-based few-shot tuning. In: Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics, vol. 1: Long Papers, pp. 7014\u20137024 (2022)","DOI":"10.18653\/v1\/2022.acl-long.483"},{"key":"36_CR6","doi-asserted-by":"crossref","unstructured":"Gao, T., Fisch, A., Chen, D.: Making pre-trained language models better few-shot learners. In: Proceedings of the 59th Annual Meeting of the ACL and the 11th IJCNLP, vol. 1: Long Papers, pp. 3816\u20133830 (2021)","DOI":"10.18653\/v1\/2021.acl-long.295"},{"key":"36_CR7","unstructured":"Hacohen, G., Dekel, A., Weinshall, D.: Active learning on a budget: opposite strategies suit high and low budgets. In: International Conference on Machine Learning, pp. 8175\u20138195. PMLR (2022)"},{"key":"36_CR8","doi-asserted-by":"crossref","unstructured":"Hambardzumyan, K., Khachatrian, H., May, J.: Warp: word-level adversarial reprogramming. In: Proceedings of the 59th Annual Meeting of the ACL and the 11th IJCNLP, vol. 1: Long Papers, pp. 4921\u20134933 (2021)","DOI":"10.18653\/v1\/2021.acl-long.381"},{"key":"36_CR9","doi-asserted-by":"crossref","unstructured":"Hu, M., Liu, B.: Mining and summarizing customer reviews. In: Proceedings of the tenth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining, pp. 168\u2013177 (2004)","DOI":"10.1145\/1014052.1014073"},{"key":"36_CR10","doi-asserted-by":"crossref","unstructured":"Hu, S., Ding, N., et\u00a0al.: Knowledgeable prompt-tuning: incorporating knowledge into prompt verbalizer for text classification. In: Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics, vol. 1: Long Papers, pp. 2225\u20132240 (2022)","DOI":"10.18653\/v1\/2022.acl-long.158"},{"key":"36_CR11","unstructured":"Kulkarni, A., Chakraborty, M., Xie, S., Li, Q.: Optimal budget allocation for crowdsourcing labels for graphs. In: Evans, R.J., Shpitser, I. (eds.) Proceedings of the Thirty-Ninth Conference on Uncertainty in Artificial Intelligence. Proceedings of Machine Learning Research, vol.\u00a0216, pp. 1154\u20131163. PMLR (2023)"},{"key":"36_CR12","doi-asserted-by":"crossref","unstructured":"Lester, B., Al-Rfou, R., Constant, N.: The power of scale for parameter-efficient prompt tuning. In: Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing. Association for Computational Linguistics (2021)","DOI":"10.18653\/v1\/2021.emnlp-main.243"},{"key":"36_CR13","doi-asserted-by":"crossref","unstructured":"Lewis, D.D., Gale, W.A.: A sequential algorithm for training text classifiers. In: Proceedings of the 17th Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, pp. 3\u201312 (1994)","DOI":"10.1007\/978-1-4471-2099-5_1"},{"key":"36_CR14","doi-asserted-by":"crossref","unstructured":"Li, X.L., Liang, P.: Prefix-tuning: optimizing continuous prompts for generation. In: Proceedings of the 59th Annual Meeting of the ACL and the 11th IJCNLP, vol. 1: Long Papers, pp. 4582\u20134597 (2021)","DOI":"10.18653\/v1\/2021.acl-long.353"},{"key":"36_CR15","doi-asserted-by":"crossref","unstructured":"Liu, C., Wang, H., Xi, N., Zhao, S., Qin, B.: Global prompt cell: a portable control module for effective prompt tuning. In: CCF International Conference on Natural Language Processing and Chinese Computing, pp. 657\u2013668 (2023)","DOI":"10.1007\/978-3-031-44693-1_51"},{"key":"36_CR16","doi-asserted-by":"crossref","unstructured":"Liu, J., Shen, D., et\u00a0al.: What makes good in-context examples for gpt-3? In: Proceedings of Deep Learning Inside Out (DeeLIO 2022): The 3rd Workshop on Knowledge Extraction and Integration for Deep Learning Architectures, pp. 100\u2013114 (2022)","DOI":"10.18653\/v1\/2022.deelio-1.10"},{"key":"36_CR17","doi-asserted-by":"crossref","unstructured":"Liu, X., Zheng, Y., Du, Z., et\u00a0al.: Gpt understands, too. AI Open (2023)","DOI":"10.1016\/j.aiopen.2023.08.012"},{"key":"36_CR18","unstructured":"Liu, Y., Ott, M., et\u00a0al.: Roberta: a robustly optimized bert pretraining approach. arXiv preprint arXiv:1907.11692 (2019)"},{"key":"36_CR19","unstructured":"Maas, A., Daly, R.E., et\u00a0al.: Learning word vectors for sentiment analysis. In: Proceedings of the 49th Annual Meeting of the Association for Computational Linguistics: Human Language Technologies, pp. 142\u2013150 (2011)"},{"key":"36_CR20","unstructured":"MacQueen, J.: Some methods for classification and analysis of multivariate observations. In: Proceedings of 5-th Berkeley Symposium on Mathematical Statistics and Probability\/University of California Press (1967)"},{"key":"36_CR21","doi-asserted-by":"crossref","unstructured":"Margatina, K., Vernikos, G., Barrault, L., Aletras, N.: Active learning by acquiring contrastive examples. In: Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, pp. 650\u2013663 (2021)","DOI":"10.18653\/v1\/2021.emnlp-main.51"},{"key":"36_CR22","doi-asserted-by":"crossref","unstructured":"Meng, Y., Shen, J., Zhang, C., Han, J.: Weakly-supervised hierarchical text classification. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol.\u00a033, pp. 6826\u20136833 (2019)","DOI":"10.1609\/aaai.v33i01.33016826"},{"key":"36_CR23","doi-asserted-by":"crossref","unstructured":"M\u00fcller, T., P\u00e9rez-Torr\u00f3, G., Basile, A., et\u00a0al.: Active few-shot learning with fasl. In: International Conference on Applications of Natural Language to Information Systems, pp. 98\u2013110 (2022)","DOI":"10.1007\/978-3-031-08473-7_9"},{"key":"36_CR24","doi-asserted-by":"crossref","unstructured":"PANG, B.: Thumbs up? sentiment classification using machine learning techniques. In: Proceedings of the Conference on Empirical Methods in Natural Language Processing (EMNLP) 2002 (2002)","DOI":"10.3115\/1118693.1118704"},{"key":"36_CR25","doi-asserted-by":"crossref","unstructured":"PANG, B.: A sentimental education: sentiment analysis using subjectivity summarization based on minimum cuts. In: Proceedings of the 42nd Meeting of the Association for Computational Linguistics (ACL) 2004 (2004)","DOI":"10.3115\/1218955.1218990"},{"key":"36_CR26","doi-asserted-by":"publisher","first-page":"53","DOI":"10.1016\/0377-0427(87)90125-7","volume":"20","author":"PJ Rousseeuw","year":"1987","unstructured":"Rousseeuw, P.J.: Silhouettes: a graphical aid to the interpretation and validation of cluster analysis. J. Comput. Appl. Math. 20, 53\u201365 (1987)","journal-title":"J. Comput. Appl. Math."},{"key":"36_CR27","doi-asserted-by":"crossref","unstructured":"Schick, T., Schmid, H., Sch\u00fctze, H.: Automatically identifying words that can serve as labels for few-shot text classification. In: Proceedings of the 28th International Conference on Computational Linguistics, pp. 5569\u20135578 (2020)","DOI":"10.18653\/v1\/2020.coling-main.488"},{"key":"36_CR28","doi-asserted-by":"crossref","unstructured":"Schick, T., Sch\u00fctze, H.: Exploiting cloze-questions for few-shot text classification and natural language inference. In: Proceedings of the 16th Conference of the European Chapter of the Association for Computational Linguistics: Main Volume, pp. 255\u2013269 (2021)","DOI":"10.18653\/v1\/2021.eacl-main.20"},{"key":"36_CR29","doi-asserted-by":"crossref","unstructured":"Schick, T., Sch\u00fctze, H.: It\u2019s not just size that matters: small language models are also few-shot learners. In: Proceedings of the 2021 NAACL-HLT, pp. 2339\u20132352 (2021)","DOI":"10.18653\/v1\/2021.naacl-main.185"},{"key":"36_CR30","doi-asserted-by":"crossref","unstructured":"Schr\u00f6der, C., Niekler, A., Potthast, M.: Revisiting uncertainty-based query strategies for active learning with transformers. In: Findings of the ACL: ACL 2022, pp. 2194\u20132203 (2022)","DOI":"10.18653\/v1\/2022.findings-acl.172"},{"key":"36_CR31","unstructured":"Sener, O., Savarese, S.: Active learning for convolutional neural networks: a core-set approach. In: International Conference on Learning Representations (2018)"},{"key":"36_CR32","doi-asserted-by":"crossref","unstructured":"Shin, T., Razeghi, Y., et\u00a0al.: Autoprompt: eliciting knowledge from language models with automatically generated prompts. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 4222\u20134235 (2020)","DOI":"10.18653\/v1\/2020.emnlp-main.346"},{"key":"36_CR33","doi-asserted-by":"crossref","unstructured":"Socher, R., Perelygin, A., et\u00a0al.: Recursive deep models for semantic compositionality over a sentiment treebank. In: Proceedings of the 2013 Conference on Empirical Methods in Natural Language Processing, pp. 1631\u20131642 (2013)","DOI":"10.18653\/v1\/D13-1170"},{"key":"36_CR34","unstructured":"Su, H., Kasai, J., et\u00a0al.: Selective annotation makes language models better few-shot learners. arXiv preprint arXiv:2209.01975 (2022)"},{"key":"36_CR35","unstructured":"Wang, H., Liu, C., et\u00a0al.: Prompt combines paraphrase: teaching pre-trained models to understand rare biomedical words. In: Proceedings of the 29th International Conference on Computational Linguistics, pp. 1422\u20131431 (2022)"},{"key":"36_CR36","doi-asserted-by":"crossref","unstructured":"Wang, H., Zhao, S., et\u00a0al.: Manifold-based verbalizer space re-embedding for tuning-free prompt-based classification. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol.\u00a038, pp. 19126\u201319134 (2024)","DOI":"10.1609\/aaai.v38i17.29880"},{"key":"36_CR37","doi-asserted-by":"publisher","first-page":"625","DOI":"10.1162\/tacl_a_00290","volume":"7","author":"A Warstadt","year":"2019","unstructured":"Warstadt, A., Singh, A., Bowman, S.R.: Neural network acceptability judgments. Trans. Assoc. Comput. Linguist. 7, 625\u2013641 (2019)","journal-title":"Trans. Assoc. Comput. Linguist."},{"issue":"1\u20133","key":"36_CR38","doi-asserted-by":"publisher","first-page":"37","DOI":"10.1016\/0169-7439(87)80084-9","volume":"2","author":"S Wold","year":"1987","unstructured":"Wold, S., Esbensen, K., Geladi, P.: Principal component analysis. Chemom. Intell. Lab. Syst. 2(1\u20133), 37\u201352 (1987)","journal-title":"Chemom. Intell. Lab. Syst."},{"key":"36_CR39","doi-asserted-by":"crossref","unstructured":"Yu, Y., Zhang, R., et\u00a0al.: Cold-start data selection for better few-shot language model fine-tuning: a prompt-based uncertainty propagation approach. In: Proceedings of the 61st Annual Meeting of the ACL, vol. 1: Long Papers, pp. 2499\u20132521 (2023)","DOI":"10.18653\/v1\/2023.acl-long.141"},{"key":"36_CR40","doi-asserted-by":"crossref","unstructured":"Yuan, M., Lin, H.T., Boyd-Graber, J.: Cold-start active learning through self-supervised language modeling. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 7935\u20137948 (2020)","DOI":"10.18653\/v1\/2020.emnlp-main.637"},{"key":"36_CR41","unstructured":"Zhang, N., Li, L., et\u00a0al.: Differentiable prompt makes pre-trained language models better few-shot learners. In: International Conference on Learning Representations (2021)"},{"key":"36_CR42","unstructured":"Zhang, X., Zhao, J., LeCun, Y.: Character-level convolutional networks for text classification. Adv. Neural Inf. Process. Syst. 28 (2015)"}],"container-title":["Lecture Notes in Computer Science","Advances in Knowledge Discovery and Data Mining"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-981-96-8170-9_36","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,14]],"date-time":"2025-06-14T18:50:52Z","timestamp":1749927052000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-981-96-8170-9_36"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"ISBN":["9789819681693","9789819681709"],"references-count":42,"URL":"https:\/\/doi.org\/10.1007\/978-981-96-8170-9_36","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025]]},"assertion":[{"value":"15 June 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"PAKDD","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Pacific-Asia Conference on Knowledge Discovery and Data Mining","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Sydney, NSW","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Australia","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"10 June 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"13 June 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"pakdd2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/pakdd2025.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}