{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,30]],"date-time":"2026-01-30T11:51:23Z","timestamp":1769773883360,"version":"3.49.0"},"publisher-location":"Cham","reference-count":23,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783032159861","type":"print"},{"value":"9783032159878","type":"electronic"}],"license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-15987-8_16","type":"book-chapter","created":{"date-parts":[[2026,1,29]],"date-time":"2026-01-29T20:27:24Z","timestamp":1769718444000},"page":"239-254","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["CLS, Averaging, or\u00a0Layer Combinations? Embedding Strategies for\u00a0Text Classification Across BERT Variants"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-4246-2126","authenticated-orcid":false,"given":"Eliton Luiz Scardin","family":"Perin","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1746-8414","authenticated-orcid":false,"given":"Mariana Caravanti","family":"de Souza","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4339-3003","authenticated-orcid":false,"given":"Anderson Bessa","family":"Costa","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4471-0886","authenticated-orcid":false,"given":"Edson Takashi","family":"Matsubara","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2026,1,30]]},"reference":[{"key":"16_CR1","doi-asserted-by":"crossref","unstructured":"Choi, H., Kim, J., Joe, S., Gwon, Y.: Evaluation of BERT and ALBERT sentence embedding performance on downstream NLP tasks. In: 2020 25th International Conference on Pattern Recognition (ICPR), pp. 5482\u20135487. IEEE (2021)","DOI":"10.1109\/ICPR48806.2021.9412102"},{"key":"16_CR2","doi-asserted-by":"publisher","unstructured":"Devlin, J., Chang, M.W., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding. In: Burstein, J., Doran, C., Solorio, T. (eds.) Proceedings of the 2019 Conference of the North, vol. abs\/1810.04805, pp. 4171\u20134186. Association for Computational Linguistics, Minneapolis, Minnesota (2019). https:\/\/doi.org\/10.18653\/v1\/N19-1423, https:\/\/aclanthology.org\/N19-1423","DOI":"10.18653\/v1\/N19-1423"},{"key":"16_CR3","doi-asserted-by":"publisher","first-page":"6518","DOI":"10.1109\/access.2024.3349952","volume":"12","author":"J Fields","year":"2024","unstructured":"Fields, J., Chovanec, K., Madiraju, P.: A survey of text classification with transformers: how wide? how large? how long? how accurate? how expensive? how safe? IEEE Access 12, 6518\u20136531 (2024). https:\/\/doi.org\/10.1109\/access.2024.3349952","journal-title":"IEEE Access"},{"issue":"1","key":"16_CR4","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1162\/coli_a_00536","volume":"51","author":"J Fodor","year":"2025","unstructured":"Fodor, J., Deyne, S.D., Suzuki, S.: Compositionality and sentence meaning: comparing semantic parsing and transformers on a challenging sentence similarity dataset. Comput. Linguist. 51(1), 139\u2013190 (2025)","journal-title":"Comput. Linguist."},{"issue":"1","key":"16_CR5","doi-asserted-by":"publisher","first-page":"28","DOI":"10.1186\/s40537-024-00885-x","volume":"11","author":"O Galal","year":"2024","unstructured":"Galal, O., Abdel-Gawad, A.H., Farouk, M.: Federated freeze BERT for text classification. J. Big Data 11(1), 28 (2024)","journal-title":"J. Big Data"},{"issue":"32","key":"16_CR6","doi-asserted-by":"publisher","first-page":"20245","DOI":"10.1007\/s00521-024-10212-3","volume":"36","author":"O Galal","year":"2024","unstructured":"Galal, O., Abdel-Gawad, A.H., Farouk, M.: Rethinking of BERT sentence embedding for text classification. Neural Comput. Appl. 36(32), 20245\u201320258 (2024)","journal-title":"Neural Comput. Appl."},{"key":"16_CR7","unstructured":"He, P., Gao, J., Chen, W.: DeBERTav3: improving deBERTa using ELECTRA-style pre-training with gradient-disentangled embedding sharing. In: The Eleventh International Conference on Learning Representations (2023). https:\/\/openreview.net\/forum?id=sE7-XhLxHA"},{"key":"16_CR8","doi-asserted-by":"publisher","unstructured":"Huang, J., et al.: WhiteningBERT: an easy unsupervised sentence embedding approach. In: Moens, M.F., Huang, X., Specia, L., Yih, S.W.t. (eds.) Findings of the Association for Computational Linguistics: EMNLP 2021, pp. 238\u2013244. Association for Computational Linguistics, Punta Cana, Dominican Republic (2021). https:\/\/doi.org\/10.18653\/v1\/2021.findings-emnlp.23, https:\/\/aclanthology.org\/2021.findings-emnlp.23\/","DOI":"10.18653\/v1\/2021.findings-emnlp.23"},{"key":"16_CR9","doi-asserted-by":"publisher","unstructured":"Kowsari, K., Jafari Meimandi, K., Heidarysafa, M., Mendu, S., Barnes, L., Brown, D.: Text classification algorithms: a survey. Information 10(4), 150 (2019). https:\/\/doi.org\/10.3390\/info10040150, https:\/\/www.mdpi.com\/2078-2489\/10\/4\/150","DOI":"10.3390\/info10040150"},{"key":"16_CR10","doi-asserted-by":"crossref","unstructured":"Li, X., Roth, D.: Learning question classifiers. In: COLING 2002: The 19th International Conference on Computational Linguistics (2002). https:\/\/aclanthology.org\/C02-1150\/","DOI":"10.3115\/1072228.1072378"},{"key":"16_CR11","unstructured":"Liu, Y., et al.: RoBERTa: a robustly optimized BERT pretraining approach. arXiv preprint arXiv:1907.11692 (2019)"},{"key":"16_CR12","doi-asserted-by":"publisher","unstructured":"Moschitti, A., Basili, R.: Complex linguistic features for text classification: a comprehensive study. In: McDonald, S., Tait, J. (eds.) Advances in Information Retrieval, pp. 181\u2013196. Springer Berlin Heidelberg, Berlin, Heidelberg (2004). https:\/\/doi.org\/10.1007\/978-3-540-24752-4_14","DOI":"10.1007\/978-3-540-24752-4_14"},{"key":"16_CR13","doi-asserted-by":"crossref","unstructured":"Pang, B., Lee, L.: Seeing stars: exploiting class relationships for sentiment categorization with respect to rating scales. In: Proceedings of the ACL (2005)","DOI":"10.3115\/1219840.1219855"},{"key":"16_CR14","doi-asserted-by":"publisher","unstructured":"Phan, X.H., Nguyen, L.M., Horiguchi, S.: Learning to classify short and sparse text & web with hidden topics from large-scale data collections. In: WWW 2008, Proceedings of the 17th International Conference on World Wide Web, pp. 91\u2013100. Association for Computing Machinery, New York, NY, USA (2008). https:\/\/doi.org\/10.1145\/1367497.1367510","DOI":"10.1145\/1367497.1367510"},{"key":"16_CR15","doi-asserted-by":"crossref","unstructured":"Reimers, N., Gurevych, I.: Sentence-BERT: sentence embeddings using siamese BERT-networks. arXiv preprint arXiv:1908.10084 (2019)","DOI":"10.18653\/v1\/D19-1410"},{"key":"16_CR16","unstructured":"Sanh, V., Debut, L., Chaumond, J., Wolf, T.: Distilbert, a distilled version of BERT: smaller, faster, cheaper and lighter. ArXiv arXiv:1910.01108 (2020)"},{"key":"16_CR17","doi-asserted-by":"crossref","unstructured":"Socher, R., et al.: Recursive deep models for semantic compositionality over a sentiment treebank. In: Yarowsky, D., Baldwin, T., Korhonen, A., Livescu, K., Bethard, S. (eds.) Proceedings of the 2013 Conference on Empirical Methods in Natural Language Processing, pp. 1631\u20131642. Association for Computational Linguistics, Seattle, Washington, USA (2013). https:\/\/aclanthology.org\/D13-1170\/","DOI":"10.18653\/v1\/D13-1170"},{"key":"16_CR18","unstructured":"Song, K., Tan, X., Qin, T., Lu, J., Liu, T.Y.: MPNet: masked and permuted pre-training for language understanding. In: Advances in Neural Information Processing Systems. Curran Associates Inc., Red Hook, NY, USA (2020)"},{"key":"16_CR19","doi-asserted-by":"crossref","unstructured":"Warner, B., et al.: Smarter, better, faster, longer: a modern bidirectional encoder for fast, memory efficient, and long context finetuning and inference. arXiv:2412.13663 (2024)","DOI":"10.18653\/v1\/2025.acl-long.127"},{"key":"16_CR20","doi-asserted-by":"publisher","unstructured":"Wu, Y., Wan, J.: A survey of text classification based on pre-trained language model. Neurocomputing 616, 128921 (2025). https:\/\/doi.org\/10.1016\/j.neucom.2024.128921, https:\/\/www.sciencedirect.com\/science\/article\/pii\/S0925231224016928","DOI":"10.1016\/j.neucom.2024.128921"},{"key":"16_CR21","doi-asserted-by":"publisher","unstructured":"Yao, L., Mao, C., Luo, Y.: Graph convolutional networks for text classification. In: Proceedings of the AAAI Conference on Artificial Intelligence, vol. 33, no. 01, pp. 7370\u20137377 (2019). https:\/\/doi.org\/10.1609\/aaai.v33i01.33017370, https:\/\/ojs.aaai.org\/index.php\/AAAI\/article\/view\/4725","DOI":"10.1609\/aaai.v33i01.33017370"},{"key":"16_CR22","doi-asserted-by":"crossref","unstructured":"Yin, W., Shang, L.: Efficient nearest neighbor emotion classification with BERT-whitening. In: Proceedings of the 2022 Conference on Empirical Methods in Natural Language Processing, pp. 4738\u20134745 (2022)","DOI":"10.18653\/v1\/2022.emnlp-main.312"},{"key":"16_CR23","doi-asserted-by":"crossref","unstructured":"Zheng, L., Guha, N., Anderson, B.R., Henderson, P., Ho, D.E.: When does pretraining help? assessing self-supervised learning for law and the casehold dataset. In: Proceedings of the 18th International Conference on Artificial Intelligence and Law. Association for Computing Machinery (2021)","DOI":"10.1145\/3462757.3466088"}],"container-title":["Lecture Notes in Computer Science","Intelligent Systems"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-15987-8_16","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,29]],"date-time":"2026-01-29T20:27:27Z","timestamp":1769718447000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-15987-8_16"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"ISBN":["9783032159861","9783032159878"],"references-count":23,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-15987-8_16","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]},"assertion":[{"value":"30 January 2026","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"BRACIS","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Brazilian Conference on Intelligent Systems","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Fortaleza-CE","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Brazil","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2 October 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"14","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"bracis2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/bracis.sbc.org.br\/2025\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}