{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,8]],"date-time":"2025-09-08T06:36:00Z","timestamp":1757313360070,"version":"3.40.3"},"publisher-location":"Cham","reference-count":22,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031417337"},{"type":"electronic","value":"9783031417344"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-41734-4_8","type":"book-chapter","created":{"date-parts":[[2023,8,18]],"date-time":"2023-08-18T07:02:59Z","timestamp":1692342179000},"page":"121-136","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["Optimizing the\u00a0Performance of\u00a0Text Classification Models by\u00a0Improving the\u00a0Isotropy of\u00a0the\u00a0Embeddings Using a\u00a0Joint Loss Function"],"prefix":"10.1007","author":[{"given":"Joseph","family":"Attieh","sequence":"first","affiliation":[]},{"given":"Abraham","family":"Woubie Zewoudie","sequence":"additional","affiliation":[]},{"given":"Vladimir","family":"Vlassov","sequence":"additional","affiliation":[]},{"given":"Adrian","family":"Flanagan","sequence":"additional","affiliation":[]},{"given":"Tom","family":"B\u00e4ckstr\u00f6m","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,8,19]]},"reference":[{"key":"8_CR1","unstructured":"Attieh, J.: Optimizing the Performance of Text Classification Models by Improving the Isotropy of the Embeddings using a Joint Loss Function. Master\u2019s thesis, Aalto University. School of Science (2022). http:\/\/urn.fi\/URN:NBN:fi:aalto-202209255727"},{"key":"8_CR2","doi-asserted-by":"publisher","unstructured":"Bi\u015b, D., Podkorytov, M., Liu, X.: Too much in common: Shifting of embeddings in transformer language models and its implications. In: Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies. pp. 5117\u20135130. Association for Computational Linguistics, Online (Jun 2021). https:\/\/doi.org\/10.18653\/v1\/2021.naacl-main.403, http:\/\/aclanthology.org\/2021.naacl-main.403","DOI":"10.18653\/v1\/2021.naacl-main.403"},{"key":"8_CR3","doi-asserted-by":"crossref","unstructured":"Ethayarajh, K.: How contextual are contextualized word representations? comparing the geometry of BERT, ELMO, and GPT-2 embeddings. vol. abs\/1909.00512 (2019). arXiv: abs\/1909.00512","DOI":"10.18653\/v1\/D19-1006"},{"key":"8_CR4","unstructured":"Gao, J., He, D., Tan, X., Qin, T., Wang, L., Liu, T.: Representation degeneration problem in training natural language generation models. In: International Conference on Learning Representations (2019). http:\/\/openreview.net\/forum?id=SkEYojRqtm"},{"key":"8_CR5","unstructured":"Gong, C., He, D., Tan, X., Qin, T., Wang, L., Liu, T.Y.: Frage: Frequency-agnostic word representation. ArXiv arXiv:1809.06858 (2018)"},{"key":"8_CR6","doi-asserted-by":"publisher","unstructured":"Kalyan, K.S., Rajasekharan, A., Sangeetha, S.: Ammus : A survey of transformer-based pretrained models in natural language processing (2021). https:\/\/doi.org\/10.48550\/ARXIV.2108.05542,","DOI":"10.48550\/ARXIV.2108.05542"},{"key":"8_CR7","doi-asserted-by":"publisher","unstructured":"Li, B., Zhou, H., He, J., Wang, M., Yang, Y., Li, L.: On the sentence embeddings from pre-trained language models. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 9119\u20139130. Association for Computational Linguistics, Online (Nov 2020). https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.733","DOI":"10.18653\/v1\/2020.emnlp-main.733"},{"key":"8_CR8","doi-asserted-by":"publisher","unstructured":"Liang, Y., Cao, R., Zheng, J., Ren, J., Gao, L.: Learning to remove: Towards isotropic pre-trained Bert embedding. In: Artificial Neural Networks and Machine Learning - ICANN 2021: 30th International Conference on Artificial Neural Networks, Bratislava, Slovakia, September 14\u201317, 2021, Proceedings, Part V, p. 448\u2013459. Springer-Verlag, Berlin, Heidelberg (2021). https:\/\/doi.org\/10.1007\/978-3-030-86383-8_36","DOI":"10.1007\/978-3-030-86383-8_36"},{"key":"8_CR9","doi-asserted-by":"publisher","unstructured":"Loshchilov, I., Hutter, F.: Decoupled weight decay regularization (2017). https:\/\/doi.org\/10.48550\/ARXIV.1711.05101","DOI":"10.48550\/ARXIV.1711.05101"},{"key":"8_CR10","unstructured":"Mu, J., Viswanath, P.: All-but-the-top: Simple and effective post-processing for word representations (2018), publisher Copyright: \u00a9 Learning Representations, ICLR 2018 - Conference Track Proceedings. All right reserved.; 6th International Conference on Learning Representations, ICLR 2018; Conference date: 30\u201304-2018 Through 03\u201305-2018"},{"key":"8_CR11","doi-asserted-by":"crossref","unstructured":"Rajaee, S., Pilehvar, M.T.: A cluster-based approach for improving isotropy in contextual embedding space. In: ACL (2021)","DOI":"10.18653\/v1\/2021.acl-short.73"},{"key":"8_CR12","doi-asserted-by":"crossref","unstructured":"Rajaee, S., Pilehvar, M.T.: How does fine-tuning affect the geometry of embedding space: a case study on isotropy. In: EMNLP (2021)","DOI":"10.18653\/v1\/2021.findings-emnlp.261"},{"key":"8_CR13","doi-asserted-by":"publisher","unstructured":"Rudman, W., Gillman, N., Rayne, T., Eickhoff, C.: IsoScore: Measuring the uniformity of embedding space utilization. In: Findings of the Association for Computational Linguistics: ACL 2022, pp. 3325\u20133339. Association for Computational Linguistics, Dublin, Ireland (May 2022). https:\/\/doi.org\/10.18653\/v1\/2022.findings-acl.262, http:\/\/aclanthology.org\/2022.findings-acl.262","DOI":"10.18653\/v1\/2022.findings-acl.262"},{"key":"8_CR14","doi-asserted-by":"publisher","unstructured":"Su, J., Cao, J., Liu, W., Ou, Y.: Whitening sentence representations for better semantics and faster retrieval (2021). https:\/\/doi.org\/10.48550\/ARXIV.2103.15316, http:\/\/arxiv.org\/abs\/2103.15316","DOI":"10.48550\/ARXIV.2103.15316"},{"key":"8_CR15","doi-asserted-by":"publisher","unstructured":"Timkey, W., van Schijndel, M.: All bark and no bite: Rogue dimensions in transformer language models obscure representational quality. In: Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, pp. 4527\u20134546. Association for Computational Linguistics, Online and Punta Cana, Dominican Republic (Nov 2021). https:\/\/doi.org\/10.18653\/v1\/2021.emnlp-main.372, http:\/\/aclanthology.org\/2021.emnlp-main.372","DOI":"10.18653\/v1\/2021.emnlp-main.372"},{"key":"8_CR16","doi-asserted-by":"publisher","unstructured":"Wang, A., Singh, A., Michael, J., Hill, F., Levy, O., Bowman, S.: GLUE: A multi-task benchmark and analysis platform for natural language understanding. In: Proceedings of the 2018 EMNLP Workshop BlackboxNLP: Analyzing and Interpreting Neural Networks for NLP, pp. 353\u2013355. Association for Computational Linguistics, Brussels, Belgium (Nov 2018). https:\/\/doi.org\/10.18653\/v1\/W18-5446, http:\/\/aclanthology.org\/W18-5446","DOI":"10.18653\/v1\/W18-5446"},{"key":"8_CR17","unstructured":"Wang, L., Huang, J., Huang, K., Hu, Z., Wang, G., Gu, Q.: Improving neural language generation with spectrum control. In: International Conference on Learning Representations (2020). http:\/\/openreview.net\/forum?id=ByxY8CNtvr"},{"key":"8_CR18","doi-asserted-by":"publisher","unstructured":"Wolf, T., et al.: Huggingface\u2019s transformers: State-of-the-art natural language processing (2019). https:\/\/doi.org\/10.48550\/ARXIV.1910.03771","DOI":"10.48550\/ARXIV.1910.03771"},{"key":"8_CR19","unstructured":"Zabihzadeh, D.: Ensemble of loss functions to improve generalizability of deep metric learning methods. arXiv:2107.01130 (2021)"},{"key":"8_CR20","doi-asserted-by":"crossref","unstructured":"Zampieri, M., Malmasi, S., Nakov, P., Rosenthal, S., Farra, N., Kumar, R.: Predicting the Type and Target of Offensive Posts in Social Media. In: Proceedings of NAACL (2019)","DOI":"10.18653\/v1\/N19-1144"},{"key":"8_CR21","doi-asserted-by":"publisher","unstructured":"Zhang, Z., Gao, C., Xu, C., Miao, R., Yang, Q., Shao, J.: Revisiting representation degeneration problem in language modeling. In: Findings of the Association for Computational Linguistics: EMNLP 2020, pp. 518\u2013527. Association for Computational Linguistics, Online (Nov 2020). https:\/\/doi.org\/10.18653\/v1\/2020.findings-emnlp.46, http:\/\/aclanthology.org\/2020.findings-emnlp.46","DOI":"10.18653\/v1\/2020.findings-emnlp.46"},{"key":"8_CR22","doi-asserted-by":"crossref","unstructured":"Zhou, W., Lin, B.Y., Ren, X.: Isobn: Fine-tuning bert with isotropic batch normalization. Proc. AAAI Conf. Artif. Intell. 35(16), 14621\u201314629 (May 2021), http:\/\/ojs.aaai.org\/index.php\/AAAI\/article\/view\/17718","DOI":"10.1609\/aaai.v35i16.17718"}],"container-title":["Lecture Notes in Computer Science","Document Analysis and Recognition - ICDAR 2023"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-41734-4_8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,18]],"date-time":"2023-08-18T07:10:20Z","timestamp":1692342620000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-41734-4_8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031417337","9783031417344"],"references-count":22,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-41734-4_8","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"19 August 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICDAR","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Document Analysis and Recognition","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"San Jos\u00e9, CA","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"USA","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21 August 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 August 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icdar2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/icdar2023.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Easychair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"316","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"154","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"49% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2.89","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1.50","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"No","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Number and type of other papers accepted : IJDAR track papers","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}