{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T10:28:35Z","timestamp":1743071315120,"version":"3.40.3"},"publisher-location":"Cham","reference-count":37,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031429132"},{"type":"electronic","value":"9783031429149"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-42914-9_9","type":"book-chapter","created":{"date-parts":[[2023,8,27]],"date-time":"2023-08-27T23:02:26Z","timestamp":1693177346000},"page":"119-132","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Comparing and\u00a0Improving Active Learning Uncertainty Measures for\u00a0Transformer Models"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-5985-4348","authenticated-orcid":false,"given":"Julius","family":"Gonsior","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Christian","family":"Falkenberg","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Silvio","family":"Magino","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2537-9841","authenticated-orcid":false,"given":"Anja","family":"Reusch","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5334-059X","authenticated-orcid":false,"given":"Claudio","family":"Hartmann","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1665-977X","authenticated-orcid":false,"given":"Maik","family":"Thiele","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8107-2775","authenticated-orcid":false,"given":"Wolfgang","family":"Lehner","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,8,28]]},"reference":[{"key":"9_CR1","unstructured":"Baram, Y., Yaniv, R.E., Luz, K.: Online choice of active learning algorithms. J. Mach. Learn. Res. 5(Mar), 255\u2013291 (2004)"},{"key":"9_CR2","unstructured":"Coleman, C., et al.: Selection via proxy: Efficient data selection for deep learning. ICLR (2020)"},{"key":"9_CR3","unstructured":"D\u2019Arcy, M., Downey, D.: Limitations of active learning with deep transformer language models (2022)"},{"key":"9_CR4","unstructured":"Devlin, J., Chang, M.W., Lee, K., Toutanova, K.: Bert: Pre-training of deep bidirectional transformers for language understanding. In: NAACL, pp. 4171\u20134186. Association for Computational Linguistics (2019)"},{"key":"9_CR5","unstructured":"Gal, Y., Ghahramani, Z.: Dropout as a bayesian approximation: Representing model uncertainty in deep learning. In: ICML, pp. 1050\u20131059. PMLR (2016)"},{"key":"9_CR6","unstructured":"Gal, Y., Islam, R., Ghahramani, Z.: Deep bayesian active learning with image data. In: International Conference on Machine Learning, pp. 1183\u20131192. PMLR (2017)"},{"key":"9_CR7","unstructured":"Gawlikowski, J., et al.: A survey of uncertainty in deep neural networks. arXiv preprint arXiv:2107.03342 (2021)"},{"key":"9_CR8","unstructured":"Gleave, A., Irving, G.: Uncertainty estimation for language reward models. arXiv preprint arXiv:2203.07472 (2022)"},{"key":"9_CR9","unstructured":"Gonsior, J., Rehak, J., Thiele, M., Koci, E., G\u00fcnther, M., Lehner, W.: Active learning for spreadsheet cell classification. In: EDBT\/ICDT Workshops (2020)"},{"key":"9_CR10","doi-asserted-by":"publisher","first-page":"47","DOI":"10.1007\/978-3-031-18840-4_4","volume-title":"Discovery Science","author":"J Gonsior","year":"2022","unstructured":"Gonsior, J., Thiele, M., Lehner, W.: Imital: learned active learning strategy on synthetic data. In: Pascal, P., Ienco, D. (eds.) Discovery Science, pp. 47\u201356. Springer Nature Switzerland, Cham (2022)"},{"key":"9_CR11","doi-asserted-by":"crossref","unstructured":"Hein, M., Andriushchenko, M., Bitterwolf, J.: Why relu networks yield high-confidence predictions far away from the training data and how to mitigate the problem. In: CVPR, pp. 41\u201350. IEEE (2019)","DOI":"10.1109\/CVPR.2019.00013"},{"key":"9_CR12","doi-asserted-by":"crossref","unstructured":"Hsu, W.N., Lin, H.T.: Active learning by learning. In: Proceedings of the Twenty-Ninth AAAI Conference on Artificial Intelligence, pp. 2659\u20132665. AAAI\u201915, AAAI Press (2015)","DOI":"10.1609\/aaai.v29i1.9597"},{"key":"9_CR13","unstructured":"Jiang, H., Kim, B., Guan, M., Gupta, M.: To trust or not to trust a classifier. In: NeurIPS 31 (2018)"},{"key":"9_CR14","doi-asserted-by":"crossref","unstructured":"Karamcheti, S., Krishna, R., Fei-Fei, L., Manning, C.: Mind your outliers! investigating the negative impact of outliers on active learning for visual question answering. In: ACL-IJCNLP, pp. 7265\u20137281. Association for Computational Linguistics (2021)","DOI":"10.18653\/v1\/2021.acl-long.564"},{"key":"9_CR15","unstructured":"Lakshminarayanan, B., Pritzel, A., Blundell, C.: Simple and scalable predictive uncertainty estimation using deep ensembles. In: NeurIPS 30 (2017)"},{"issue":"7553","key":"9_CR16","doi-asserted-by":"publisher","first-page":"436","DOI":"10.1038\/nature14539","volume":"521","author":"Y LeCun","year":"2015","unstructured":"LeCun, Y., Bengio, Y., Hinton, G.: Deep learning. Nature 521(7553), 436\u2013444 (2015)","journal-title":"Nature"},{"key":"9_CR17","doi-asserted-by":"crossref","unstructured":"Lewis, D.D., Gale, W.A.: A sequential algorithm for training text classifiers. In: SIGIR \u201994, pp. 3\u201312. Springer, London (1994)","DOI":"10.1007\/978-1-4471-2099-5_1"},{"key":"9_CR18","unstructured":"Liu, Y., et al.: Roberta: A robustly optimized bert pretraining approach. arXiv preprint arXiv:1907.11692 (2019)"},{"key":"9_CR19","doi-asserted-by":"crossref","unstructured":"Lowell, D., Lipton, Z.C., Wallace, B.C.: Practical obstacles to deploying active learning. In: EMNLP-IJCNLP, pp. 21\u201330 (2019)","DOI":"10.18653\/v1\/D19-1003"},{"key":"9_CR20","unstructured":"McCallumzy, A.K., Nigamy, K.: Employing em and pool-based active learning for text classification. In: ICML, pp. 359\u2013367. Citeseer (1998)"},{"key":"9_CR21","unstructured":"Mo\u017cejko, M., Susik, M., Karczewski, R.: Inhibited softmax for uncertainty estimation in neural networks. arXiv preprint arXiv:1810.01861 (2018)"},{"key":"9_CR22","unstructured":"Pearce, T., Brintrup, A., Zhu, J.: Understanding softmax confidence and uncertainty. arXiv preprint arXiv:2106.04972 (2021)"},{"key":"9_CR23","unstructured":"Sankararaman, K.A., Wang, S., Fang, H.: Bayesformer: Transformer with uncertainty estimation. arXiv preprint arXiv:2206.00826 (2022)"},{"key":"9_CR24","doi-asserted-by":"crossref","unstructured":"Scheffer, T., Decomain, C., Wrobel, S.: Mining the web with active hidden markov models. In: Hoffmann, F., Hand, D.J., Adams, N., Fisher, D., Guimaraes, G. (eds.) ICDM, pp. 309\u2013318. IEEE Comput. Soc (2001)","DOI":"10.1007\/3-540-44816-0_31"},{"key":"9_CR25","unstructured":"Schr\u00f6der, C., M\u00fcller, L., Niekler, A., Potthast, M.: Small-text: Active learning for text classification in python. arXiv preprint arXiv:2107.10314 (2021)"},{"key":"9_CR26","unstructured":"Schr\u00f6der, C., Niekler, A.: A survey of active learning for text classification using deep neural networks. arXiv preprint arXiv:2008.07267 (2020)"},{"key":"9_CR27","doi-asserted-by":"crossref","unstructured":"Schr\u00f6der, C., Niekler, A., Potthast, M.: Revisiting uncertainty-based query strategies for active learning with transformers. In: ACL, pp. 2194\u20132203. Association for Computational Linguistics (2022)","DOI":"10.18653\/v1\/2022.findings-acl.172"},{"key":"9_CR28","unstructured":"Sensoy, M., Kaplan, L., Kandemir, M.: Evidential deep learning to quantify classification uncertainty. In: NeurIPS 31 (2018)"},{"issue":"1","key":"9_CR29","first-page":"1","volume":"6","author":"B Settles","year":"2012","unstructured":"Settles, B.: Active learning. Synth. Lect. Artif. Intell. Mach. Learn. 6(1), 1\u2013114 (2012)","journal-title":"Synth. Lect. Artif. Intell. Mach. Learn."},{"key":"9_CR30","doi-asserted-by":"crossref","unstructured":"Seung, H.S., Opper, M., Sompolinsky, H.: Query by committee. In: Proceedings of the Fifth Annual Workshop On Computational Learning Theory, pp. 287\u2013294. COLT \u201992, ACM (1992)","DOI":"10.1145\/130385.130417"},{"issue":"3","key":"9_CR31","doi-asserted-by":"publisher","first-page":"379","DOI":"10.1002\/j.1538-7305.1948.tb01338.x","volume":"27","author":"CE Shannon","year":"1948","unstructured":"Shannon, C.E.: A mathematical theory of communication. Bell Syst. Tech. J. 27(3), 379\u2013423 (1948)","journal-title":"Bell Syst. Tech. J."},{"key":"9_CR32","doi-asserted-by":"crossref","unstructured":"Szegedy, C., Vanhoucke, V., Ioffe, S., Shlens, J., Wojna, Z.: Rethinking the inception architecture for computer vision. In: CVPR, pp. 2818\u20132826. IEEE (2016)","DOI":"10.1109\/CVPR.2016.308"},{"key":"9_CR33","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A.N., Kaiser, L., Polosukhin, I.: Attention is all you need. In: NeurIPS 30 (2017)"},{"key":"9_CR34","doi-asserted-by":"crossref","unstructured":"Weiss, M., Tonella, P.: Simple techniques work surprisingly well for neural network test prioritization and active learning (replicability study). arXiv preprint arXiv:2205.00664 (2022)","DOI":"10.1145\/3533767.3534375"},{"key":"9_CR35","doi-asserted-by":"crossref","unstructured":"Yoo, D., Kweon, I.S.: Learning loss for active learning. In: Proceedings of the IEEE\/CVF Conference On Computer Vision and Pattern Recognition, pp. 93\u2013102 (2019)","DOI":"10.1109\/CVPR.2019.00018"},{"key":"9_CR36","doi-asserted-by":"crossref","unstructured":"Zhan, X., Liu, H., Li, Q., Chan, A.B.: A comparative survey: Benchmarking for pool-based active learning. In: IJCAI, pp. 4679\u20134686 (2021), survey Track","DOI":"10.24963\/ijcai.2021\/634"},{"key":"9_CR37","unstructured":"Zhang, J., Kailkhura, B., Han, T.Y.J.: Mix-n-match: Ensemble and compositional methods for uncertainty calibration in deep learning. In: ICML, pp. 11117\u201311128. PMLR (2020)"}],"container-title":["Lecture Notes in Computer Science","Advances in Databases and Information Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-42914-9_9","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,27]],"date-time":"2023-08-27T23:15:40Z","timestamp":1693178140000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-42914-9_9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031429132","9783031429149"],"references-count":37,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-42914-9_9","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"28 August 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ADBIS","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Advances in Databases and Information Systems","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Barcelona","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Spain","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 September 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"7 September 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"adbis2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/adbis.eu\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Single-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"CMT","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"77","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"14","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"25","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"18% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"N\/A","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"N\/A","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}