{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T15:17:23Z","timestamp":1759331843171,"version":"3.37.3"},"reference-count":63,"publisher":"Springer Science and Business Media LLC","issue":"10","license":[{"start":{"date-parts":[[2023,5,27]],"date-time":"2023-05-27T00:00:00Z","timestamp":1685145600000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,5,27]],"date-time":"2023-05-27T00:00:00Z","timestamp":1685145600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"DOI":"10.13039\/501100012166","name":"National Key R&D Program of China","doi-asserted-by":"crossref","award":["2020AAA0106501"],"award-info":[{"award-number":["2020AAA0106501"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"crossref"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62236004","61976072"],"award-info":[{"award-number":["62236004","61976072"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int. J. Mach. Learn. 
& Cyber."],"published-print":{"date-parts":[[2023,10]]},"DOI":"10.1007\/s13042-023-01854-1","type":"journal-article","created":{"date-parts":[[2023,5,27]],"date-time":"2023-05-27T03:31:18Z","timestamp":1685158278000},"page":"3621-3639","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["Improving cross-lingual language understanding with consistency regularization-based fine-tuning"],"prefix":"10.1007","volume":"14","author":[{"given":"Bo","family":"Zheng","sequence":"first","affiliation":[]},{"given":"Wanxiang","family":"Che","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,5,27]]},"reference":[{"key":"1854_CR1","unstructured":"Aghajanyan A, Shrivastava A, Gupta A, et\u00a0al (2020) Better fine-tuning by reducing representational collapse. CoRR. arXiv:2008.03156"},{"key":"1854_CR2","doi-asserted-by":"crossref","unstructured":"Artetxe M, Ruder S, Yogatama D (2020) On the cross-lingual transferability of monolingual representations. In: Jurafsky D, Chai J, Schluter N, et\u00a0al (eds) Proceedings of the 58th annual meeting of the association for computational linguistics, ACL 2020, Online, July 5\u201310, 2020. Association for Computational Linguistics, pp 4623\u20134637. https:\/\/www.aclweb.org\/anthology\/2020.acl-main.421\/","DOI":"10.18653\/v1\/2020.acl-main.421"},{"key":"1854_CR3","unstructured":"Athiwaratkun B, Finzi M, Izmailov P, et\u00a0al (2019) There are many consistent explanations of unlabeled data: why you should average. In: 7th international conference on learning representations, ICLR 2019, New Orleans, LA, USA, May 6\u20139. OpenReview.net, https:\/\/openreview.net\/forum?id=rkgKBhA5Y7"},{"key":"1854_CR4","unstructured":"Carmon Y, Raghunathan A, Schmidt L, et\u00a0al (2019) Unlabeled data improves adversarial robustness. 
In: Wallach HM, Larochelle H, Beygelzimer A, et\u00a0al (eds) Advances in neural information processing systems 32: annual conference on neural information processing systems 2019, NeurIPS 2019, 8\u201314 December 2019, Vancouver, BC, Canada, pp 11190\u201311201. http:\/\/papers.nips.cc\/paper\/9298-unlabeled-data-improves-adversarial-robustness"},{"key":"1854_CR5","doi-asserted-by":"crossref","unstructured":"Chi Z, Dong L, Wei F, et\u00a0al (2020) InfoXLM: an information-theoretic framework for cross-lingual language model pre-training. CoRR. arXiv:2007.07834","DOI":"10.18653\/v1\/2021.naacl-main.280"},{"key":"1854_CR6","doi-asserted-by":"publisher","unstructured":"Chi Z, Dong L, Zheng B, et\u00a0al (2021) Improving pretrained cross-lingual language models via self-labeled word alignment. In: Zong C, Xia F, Li W, et\u00a0al (eds) Proceedings of the 59th annual meeting of the association for computational linguistics and the 11th international joint conference on natural language processing, ACL\/IJCNLP 2021, (vol 1: Long Papers), Virtual Event, August 1\u20136, 2021. Association for Computational Linguistics, pp 3418\u20133430. https:\/\/doi.org\/10.18653\/v1\/2021.acl-long.265","DOI":"10.18653\/v1\/2021.acl-long.265"},{"key":"1854_CR7","doi-asserted-by":"publisher","unstructured":"Chi Z, Huang S, Dong L, et\u00a0al (2022) XLM-E: cross-lingual language model pre-training via ELECTRA. In: Muresan S, Nakov P, Villavicencio A (eds) Proceedings of the 60th annual meeting of the association for computational linguistics (vol 1: Long Papers), ACL 2022, Dublin, Ireland, May 22\u201327, 2022. Association for Computational Linguistics, pp 6170\u20136182. https:\/\/doi.org\/10.18653\/v1\/2022.acl-long.427","DOI":"10.18653\/v1\/2022.acl-long.427"},{"key":"1854_CR8","doi-asserted-by":"publisher","unstructured":"Chung HW, Garrette D, Tan KC, et\u00a0al (2020) Improving multilingual models with language-clustered vocabularies. 
In: Webber B, Cohn T, He Y, et\u00a0al (eds) Proceedings of the 2020 conference on empirical methods in natural language processing, EMNLP 2020, Online, November 16\u201320, 2020. Association for Computational Linguistics, pp 4536\u20134546. https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.367","DOI":"10.18653\/v1\/2020.emnlp-main.367"},{"key":"1854_CR9","doi-asserted-by":"crossref","unstructured":"Clark JH, Palomaki J, Nikolaev V, et\u00a0al (2020) Tydi QA: a benchmark for information-seeking question answering in typologically diverse languages. Trans Assoc Comput Linguist 8:454\u2013470. https:\/\/transacl.org\/ojs\/index.php\/tacl\/article\/view\/1929","DOI":"10.1162\/tacl_a_00317"},{"key":"1854_CR10","unstructured":"Conneau A, Lample G (2019) Cross-lingual language model pretraining. In: Wallach HM, Larochelle H, Beygelzimer A, et\u00a0al (eds) Advances in neural information processing systems 32: annual conference on neural information processing systems 2019, NeurIPS 2019, 8\u201314 December 2019, Vancouver, BC, Canada, pp 7057\u20137067. http:\/\/papers.nips.cc\/paper\/8928-cross-lingual-language-model-pretraining"},{"key":"1854_CR11","doi-asserted-by":"publisher","unstructured":"Conneau A, Rinott R, Lample G, et\u00a0al (2018) XNLI: evaluating cross-lingual sentence representations. In: Riloff E, Chiang D, Hockenmaier J, et\u00a0al (eds) Proceedings of the 2018 conference on empirical methods in natural language processing, Brussels, Belgium, October 31\u2013November 4, 2018. Association for Computational Linguistics, pp 2475\u20132485. https:\/\/doi.org\/10.18653\/v1\/d18-1269","DOI":"10.18653\/v1\/d18-1269"},{"key":"1854_CR12","doi-asserted-by":"crossref","unstructured":"Conneau A, Khandelwal K, Goyal N, et\u00a0al (2020a) Unsupervised cross-lingual representation learning at scale. 
In: Jurafsky D, Chai J, Schluter N, et\u00a0al (eds) Proceedings of the 58th annual meeting of the association for computational linguistics, ACL 2020, Online, July 5\u201310, 2020. Association for Computational Linguistics, pp 8440\u20138451. http:\/\/www.aclweb.org\/anthology\/2020.acl-main.747\/","DOI":"10.18653\/v1\/2020.acl-main.747"},{"key":"1854_CR13","doi-asserted-by":"crossref","unstructured":"Conneau A, Wu S, Li H, et\u00a0al (2020b) Emerging cross-lingual structure in pretrained language models. In: Jurafsky D, Chai J, Schluter N, et\u00a0al (eds) Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, ACL 2020, Online, July 5\u201310, 2020. Association for Computational Linguistics, pp 6022\u20136034. https:\/\/www.aclweb.org\/anthology\/2020.acl-main.536\/","DOI":"10.18653\/v1\/2020.acl-main.536"},{"key":"1854_CR14","doi-asserted-by":"publisher","unstructured":"Devlin J, Chang M, Lee K, et\u00a0al (2019) BERT: pre-training of deep bidirectional transformers for language understanding. In: Burstein J, Doran C, Solorio T (eds) Proceedings of the 2019 conference of the North American chapter of the Association for computational linguistics: human language technologies, NAACL-HLT 2019, Minneapolis, MN, USA, June 2\u20137, 2019, vol 1 (Long and Short Papers). Association for Computational Linguistics, pp 4171\u20134186. https:\/\/doi.org\/10.18653\/v1\/n19-1423","DOI":"10.18653\/v1\/n19-1423"},{"key":"1854_CR15","unstructured":"Fang Y, Wang S, Gan Z, et\u00a0al (2020) FILTER: an enhanced fusion method for cross-lingual language understanding. CoRR. arXiv:2009.05166"},{"key":"1854_CR16","doi-asserted-by":"publisher","unstructured":"Faruqui M, Dyer C (2014) Improving vector space word representations using multilingual correlation. In: Bouma G, Parmentier Y (eds) Proceedings of the 14th conference of the European chapter of the association for computational linguistics, EACL 2014, April 26\u201330, 2014, Gothenburg, Sweden. 
The Association for Computer Linguistics, pp 462\u2013471. https:\/\/doi.org\/10.3115\/v1\/e14-1049","DOI":"10.3115\/v1\/e14-1049"},{"key":"1854_CR17","doi-asserted-by":"crossref","unstructured":"Fei H, Zhang M, Ji D (2020) Cross-lingual semantic role labeling with high-quality translated training corpus. In: Jurafsky D, Chai J, Schluter N, et\u00a0al (eds) Proceedings of the 58th annual meeting of the association for computational linguistics, ACL 2020, Online, July 5\u201310, 2020. Association for Computational Linguistics, pp 7014\u20137026. http:\/\/www.aclweb.org\/anthology\/2020.acl-main.627\/","DOI":"10.18653\/v1\/2020.acl-main.627"},{"key":"1854_CR18","doi-asserted-by":"crossref","unstructured":"Gao T, Han X, Xie R, et\u00a0al (2020) Neural snowball for few-shot relation learning. In: The thirty-fourth AAAI conference on artificial intelligence, AAAI 2020, the thirty-second innovative applications of artificial intelligence conference, IAAI 2020, the tenth AAAI symposium on educational advances in artificial intelligence, EAAI 2020, New York, NY, USA, February 7\u201312, 2020. AAAI Press, pp 7772\u20137779. http:\/\/ojs.aaai.org\/index.php\/AAAI\/article\/view\/6281","DOI":"10.1609\/aaai.v34i05.6281"},{"key":"1854_CR19","doi-asserted-by":"publisher","unstructured":"Guo J, Che W, Yarowsky D, et\u00a0al (2015) Cross-lingual dependency parsing based on distributed representations. In: Proceedings of the 53rd annual meeting of the association for computational linguistics and the 7th international joint conference on natural language processing of the Asian federation of natural language processing, ACL 2015, July 26\u201331, 2015, Beijing, China, vol 1: Long Papers. The Association for Computer Linguistics, pp 1234\u20131244. 
https:\/\/doi.org\/10.3115\/v1\/p15-1119","DOI":"10.3115\/v1\/p15-1119"},{"key":"1854_CR20","doi-asserted-by":"publisher","unstructured":"Hou Y, Che W, Lai Y, et\u00a0al (2020) Few-shot slot tagging with collapsed dependency transfer and label-enhanced task-adaptive projection network. In: Jurafsky D, Chai J, Schluter N, et\u00a0al (eds) Proceedings of the 58th annual meeting of the association for computational linguistics, ACL 2020, Online, July 5-10, 2020. Association for Computational Linguistics, pp 1381\u20131393. https:\/\/doi.org\/10.18653\/v1\/2020.acl-main.128","DOI":"10.18653\/v1\/2020.acl-main.128"},{"key":"1854_CR21","unstructured":"Hou Y, Mao J, Lai Y, et\u00a0al (2020) Fewjoint: a few-shot learning benchmark for joint language understanding. CoRR. arXiv:2009.08138"},{"key":"1854_CR22","unstructured":"Hu J, Ruder S, Siddhant A, et\u00a0al (2020) XTREME: A massively multilingual multi-task benchmark for evaluating cross-lingual generalisation. In: Proceedings of the 37th international conference on machine learning, ICML 2020, 13\u201318 July 2020, virtual event, proceedings of machine learning research, vol 119. PMLR, pp 4411\u20134421. http:\/\/proceedings.mlr.press\/v119\/hu20b.html"},{"key":"1854_CR23","doi-asserted-by":"publisher","unstructured":"Hu J, Johnson M, Firat O, et\u00a0al (2021) Explicit alignment objectives for multilingual bidirectional encoders. In: Toutanova K, Rumshisky A, Zettlemoyer L, et\u00a0al (eds) Proceedings of the 2021 conference of the North American chapter of the association for computational linguistics: human language technologies, NAACL-HLT 2021, Online, June 6\u201311, 2021. Association for Computational Linguistics, pp 3633\u20133643. https:\/\/doi.org\/10.18653\/v1\/2021.naacl-main.284","DOI":"10.18653\/v1\/2021.naacl-main.284"},{"key":"1854_CR24","unstructured":"Hu W, Miyato T, Tokui S, et\u00a0al (2017) Learning discrete representations via information maximizing self-augmented training. 
In: Precup D, Teh YW (eds) Proceedings of the 34th international conference on machine learning, ICML 2017, Sydney, NSW, Australia, 6\u201311 August 2017, proceedings of machine learning research, vol\u00a070. PMLR, pp 1558\u20131567. http:\/\/proceedings.mlr.press\/v70\/hu17b.html"},{"key":"1854_CR25","doi-asserted-by":"crossref","unstructured":"Jiang H, He P, Chen W, et\u00a0al (2020) SMART: Robust and efficient fine-tuning for pre-trained natural language models through principled regularized optimization. In: Jurafsky D, Chai J, Schluter N, et\u00a0al (eds) Proceedings of the 58th annual meeting of the association for computational linguistics, ACL 2020, Online, July 5\u201310, 2020. Association for Computational Linguistics, pp 2177\u20132190. https:\/\/www.aclweb.org\/anthology\/2020.acl-main.197\/","DOI":"10.18653\/v1\/2020.acl-main.197"},{"key":"1854_CR26","doi-asserted-by":"publisher","unstructured":"Kudo T (2018) Subword regularization: Improving neural network translation models with multiple subword candidates. In: Gurevych I, Miyao Y (eds) Proceedings of the 56th annual meeting of the association for computational linguistics, ACL 2018, Melbourne, Australia, July 15\u201320, 2018, vol 1: long papers. Association for Computational Linguistics, pp 66\u201375. https:\/\/doi.org\/10.18653\/v1\/P18-1007. https:\/\/www.aclweb.org\/anthology\/P18-1007\/","DOI":"10.18653\/v1\/P18-1007"},{"key":"1854_CR27","doi-asserted-by":"publisher","unstructured":"Kudo T, Richardson J (2018) Sentencepiece: A simple and language independent subword tokenizer and detokenizer for neural text processing. In: Blanco E, Lu W (eds) Proceedings of the 2018 conference on empirical methods in natural language processing, EMNLP 2018: system demonstrations, Brussels, Belgium, October 31\u2013November 4, 2018. Association for Computational Linguistics, pp 66\u201371. 
https:\/\/doi.org\/10.18653\/v1\/d18-2012","DOI":"10.18653\/v1\/d18-2012"},{"key":"1854_CR28","unstructured":"Lample G, Conneau A, Denoyer L, et\u00a0al (2018) Unsupervised machine translation using monolingual corpora only. In: 6th international conference on learning representations, ICLR 2018, Vancouver, BC, Canada, April 30\u2013May 3, 2018, conference track proceedings. OpenReview.net, http:\/\/openreview.net\/forum?id=rkYTTf-AZ"},{"key":"1854_CR29","doi-asserted-by":"publisher","unstructured":"Lauscher A, Ravishankar V, Vulic I, et\u00a0al (2020) From zero to hero: On the limitations of zero-shot language transfer with multilingual transformers. In: Webber B, Cohn T, He Y, et\u00a0al (eds) Proceedings of the 2020 conference on empirical methods in natural language processing, EMNLP 2020, Online, November 16\u201320, 2020. Association for Computational Linguistics, pp 4483\u20134499. https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.363","DOI":"10.18653\/v1\/2020.emnlp-main.363"},{"key":"1854_CR30","doi-asserted-by":"crossref","unstructured":"Lewis PSH, Oguz B, Rinott R, et\u00a0al (2020) MLQA: evaluating cross-lingual extractive question answering. In: Jurafsky D, Chai J, Schluter N, et\u00a0al (eds) Proceedings of the 58th annual meeting of the association for computational linguistics, ACL 2020, Online, July 5\u201310, 2020. Association for Computational Linguistics, pp 7315\u20137330. http:\/\/www.aclweb.org\/anthology\/2020.acl-main.653\/","DOI":"10.18653\/v1\/2020.acl-main.653"},{"key":"1854_CR31","doi-asserted-by":"publisher","unstructured":"Li H, Yan H, Li Y, et\u00a0al (2023) Distinguishability calibration to in-context learning. CoRR. https:\/\/doi.org\/10.48550\/arXiv.2302.06198. arXiv:2302.06198","DOI":"10.48550\/arXiv.2302.06198"},{"key":"1854_CR32","unstructured":"Liu X, Cheng H, He P, et\u00a0al (2020) Adversarial training for large neural language models. CoRR. 
arXiv:2004.08994"},{"key":"1854_CR33","doi-asserted-by":"crossref","unstructured":"Luo F, Wang W, Liu J, et\u00a0al (2020) VECO: Variable encoder-decoder pre-training for cross-lingual understanding and generation. arXiv:2010.16046","DOI":"10.18653\/v1\/2021.acl-long.308"},{"key":"1854_CR34","doi-asserted-by":"publisher","unstructured":"Lv X, Gu Y, Han X, et\u00a0al (2019) Adapting meta knowledge graph information for multi-hop reasoning over few-shot relations. In: Inui K, Jiang J, Ng V, et\u00a0al (eds) Proceedings of the 2019 conference on empirical methods in natural language processing and the 9th international joint conference on natural language processing, EMNLP-IJCNLP 2019, Hong Kong, China, November 3\u20137, 2019. Association for Computational Linguistics, pp 3374\u20133379. https:\/\/doi.org\/10.18653\/v1\/D19-1334","DOI":"10.18653\/v1\/D19-1334"},{"key":"1854_CR35","unstructured":"Mikolov T, Le QV, Sutskever I (2013) Exploiting similarities among languages for machine translation. CoRR. arXiv:1309.4168"},{"issue":"8","key":"1854_CR36","doi-asserted-by":"publisher","first-page":"1979","DOI":"10.1109\/TPAMI.2018.2858821","volume":"41","author":"T Miyato","year":"2019","unstructured":"Miyato T, Maeda S, Koyama M et al (2019) Virtual adversarial training: a regularization method for supervised and semi-supervised learning. IEEE Trans Pattern Anal Mach Intell 41(8):1979\u20131993. https:\/\/doi.org\/10.1109\/TPAMI.2018.2858821","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"1854_CR37","unstructured":"Nivre J, Blokland R, Partanen N, et\u00a0al (2018) Universal dependencies 2.2"},{"key":"1854_CR38","doi-asserted-by":"publisher","unstructured":"Pan X, Zhang B, May J, et\u00a0al (2017) Cross-lingual name tagging and linking for 282 languages. In: Barzilay R, Kan M (eds) Proceedings of the 55th annual meeting of the association for computational linguistics, ACL 2017, Vancouver, Canada, July 30\u2013August 4, volume 1: long papers. 
Association for Computational Linguistics, pp 1946\u20131958. https:\/\/doi.org\/10.18653\/v1\/P17-1178","DOI":"10.18653\/v1\/P17-1178"},{"key":"1854_CR39","unstructured":"Phang J, Htut PM, Pruksachatkun Y, et\u00a0al (2020) English intermediate-task training improves zero-shot cross-lingual transfer too. CoRR. arXiv:2005.13013"},{"key":"1854_CR40","doi-asserted-by":"crossref","unstructured":"Provilkov I, Emelianenko D, Voita E (2020) BPE-dropout: simple and effective subword regularization. In: Jurafsky D, Chai J, Schluter N, et\u00a0al (eds) Proceedings of the 58th annual meeting of the association for computational linguistics, ACL 2020, Online, July 5\u201310, 2020. Association for Computational Linguistics, pp 1882\u20131892. https:\/\/www.aclweb.org\/anthology\/2020.acl-main.170\/","DOI":"10.18653\/v1\/2020.acl-main.170"},{"key":"1854_CR41","doi-asserted-by":"publisher","unstructured":"Qin L, Ni M, Zhang Y, et\u00a0al (2020) CoSDA-ML: multi-lingual code-switching data augmentation for zero-shot cross-lingual NLP. In: Bessiere C (eds) Proceedings of the twenty-ninth international joint conference on artificial intelligence, IJCAI 2020. ijcai.org, pp 3853\u20133860. https:\/\/doi.org\/10.24963\/ijcai.2020\/533","DOI":"10.24963\/ijcai.2020\/533"},{"key":"1854_CR42","doi-asserted-by":"publisher","unstructured":"Shah DJ, Gupta R, Fayazi AA, et\u00a0al (2019) Robust zero-shot cross-domain slot filling with example values. In: Korhonen A, Traum DR, M\u00e0rquez L (eds) Proceedings of the 57th conference of the association for computational linguistics, ACL 2019, Florence, Italy, July 28\u2013August 2, 2019, vol 1: long papers. Association for Computational Linguistics, pp 5484\u20135490. https:\/\/doi.org\/10.18653\/v1\/p19-1547","DOI":"10.18653\/v1\/p19-1547"},{"key":"1854_CR43","unstructured":"Singh J, McCann B, Keskar NS, et\u00a0al (2019) XLDA: cross-lingual data augmentation for natural language inference and question answering. CoRR. 
arXiv:1905.11471"},{"key":"1854_CR44","doi-asserted-by":"publisher","unstructured":"Sun S, Sun Q, Zhou K, et\u00a0al (2019) Hierarchical attention prototypical networks for few-shot text classification. In: Inui K, Jiang J, Ng V, et\u00a0al (eds) Proceedings of the 2019 conference on empirical methods in natural language processing and the 9th international joint conference on natural language processing, EMNLP-IJCNLP 2019, Hong Kong, China, November 3\u20137, 2019. Association for Computational Linguistics, pp 476\u2013485. https:\/\/doi.org\/10.18653\/v1\/D19-1045","DOI":"10.18653\/v1\/D19-1045"},{"key":"1854_CR45","unstructured":"Tarvainen A, Valpola H (2017) Mean teachers are better role models: Weight-averaged consistency targets improve semi-supervised deep learning results. In: 5th international conference on learning representations, ICLR 2017, Toulon, France, April 24\u201326, 2017, Workshop Track Proceedings. OpenReview.net, http:\/\/openreview.net\/forum?id=ry8u21rtl"},{"key":"1854_CR46","doi-asserted-by":"publisher","unstructured":"Wang Y, Che W, Guo J, et\u00a0al (2019) Cross-lingual BERT transformation for zero-shot dependency parsing. In: Inui K, Jiang J, Ng V, et\u00a0al (eds) Proceedings of the 2019 conference on empirical methods in natural language processing and the 9th international joint conference on natural language processing, EMNLP-IJCNLP 2019, Hong Kong, China, November 3\u20137, 2019. Association for Computational Linguistics, pp 5720\u20135726. https:\/\/doi.org\/10.18653\/v1\/D19-1575","DOI":"10.18653\/v1\/D19-1575"},{"key":"1854_CR47","unstructured":"Xie Q, Dai Z, Hovy EH, et\u00a0al (2020) Unsupervised data augmentation for consistency training. In: Larochelle H, Ranzato M, Hadsell R, et\u00a0al (eds) Advances in neural information processing systems 33: annual conference on neural information processing systems 2020, NeurIPS 2020, December 6\u201312, 2020, virtual. 
http:\/\/proceedings.neurips.cc\/paper\/2020\/hash\/44feb0096faa8326192570788b38c1d1-Abstract.html"},{"key":"1854_CR48","doi-asserted-by":"crossref","unstructured":"Xu H, Murray K (2022) Por qu\u00e9 n\u00e3o utiliser alla spr\u00e5k? mixed training with gradient optimization in few-shot cross-lingual transfer. CoRR. arXiv:2204.13869","DOI":"10.18653\/v1\/2022.findings-naacl.157"},{"key":"1854_CR49","doi-asserted-by":"publisher","unstructured":"Xu R, Yang Y, Otani N, et\u00a0al (2018) Unsupervised cross-lingual transfer of word embedding spaces. In: Riloff E, Chiang D, Hockenmaier J, et\u00a0al (eds) Proceedings of the 2018 conference on empirical methods in natural language processing, Brussels, Belgium, October 31\u2013November 4, 2018. Association for Computational Linguistics, pp 2465\u20132474. https:\/\/doi.org\/10.18653\/v1\/d18-1268","DOI":"10.18653\/v1\/d18-1268"},{"issue":"4","key":"1854_CR50","doi-asserted-by":"publisher","first-page":"987","DOI":"10.1162\/coli_a_00459","volume":"48","author":"H Yan","year":"2022","unstructured":"Yan H, Gui L, He Y (2022) Hierarchical interpretation of neural text classification. Comput Linguist 48(4):987\u20131020. https:\/\/doi.org\/10.1162\/coli_a_00459","journal-title":"Comput Linguist"},{"key":"1854_CR51","unstructured":"Yan H, Gui L, Li W, et\u00a0al (2022b) Addressing token uniformity in transformers via singular value transformation. In: Cussens J, Zhang K (eds) Uncertainty in artificial intelligence, proceedings of the thirty-eighth conference on uncertainty in artificial intelligence, UAI 2022, 1\u20135 August 2022, Eindhoven, The Netherlands, proceedings of machine learning research, vol 180. PMLR, pp 2181\u20132191. 
http:\/\/proceedings.mlr.press\/v180\/yan22b.html"},{"issue":"22","key":"1854_CR52","doi-asserted-by":"publisher","first-page":"29799","DOI":"10.1007\/s11042-018-5772-4","volume":"77","author":"L Yan","year":"2018","unstructured":"Yan L, Zheng Y, Cao J (2018) Few-shot learning for short text classification. Multimed Tools Appl 77(22):29799\u201329810. https:\/\/doi.org\/10.1007\/s11042-018-5772-4","journal-title":"Multimed Tools Appl"},{"key":"#cr-split#-1854_CR53.1","unstructured":"Yang H, Chen H, Zhou H et al (2022) Enhancing cross-lingual transfer by"},{"key":"#cr-split#-1854_CR53.2","unstructured":"manifold mixup. In: The 10th International conference on learning representations, ICLR 2022. Virtual Event. April 25-29, 2022"},{"key":"1854_CR54","doi-asserted-by":"publisher","unstructured":"Yang Y, Zhang Y, Tar C, et\u00a0al (2019) PAWS-X: A cross-lingual adversarial dataset for paraphrase identification. In: Inui K, Jiang J, Ng V, et\u00a0al (eds) Proceedings of the 2019 conference on empirical methods in natural language processing and the 9th international joint conference on natural language processing, EMNLP-IJCNLP 2019, Hong Kong, China, November 3\u20137, 2019. Association for Computational Linguistics, pp 3685\u20133690. https:\/\/doi.org\/10.18653\/v1\/D19-1382","DOI":"10.18653\/v1\/D19-1382"},{"key":"1854_CR55","doi-asserted-by":"publisher","unstructured":"Ye M, Zhang X, Yuen PC, et\u00a0al (2019) Unsupervised embedding learning via invariant and spreading instance feature. In: IEEE conference on computer vision and pattern recognition, CVPR 2019, Long Beach, CA, USA, June 16\u201320, 2019. Computer Vision Foundation\/IEEE, pp 6210\u20136219. https:\/\/doi.org\/10.1109\/CVPR.2019.00637. 
http:\/\/openaccess.thecvf.com\/content_CVPR_2019\/html\/Ye_Unsupervised_Embedding_Learning_via_Invariant_and_Spreading_Instance_Feature_CVPR_2019_paper.html","DOI":"10.1109\/CVPR.2019.00637"},{"key":"1854_CR56","doi-asserted-by":"publisher","unstructured":"Yu M, Guo X, Yi J, et\u00a0al (2018) Diverse few-shot text classification with multiple metrics. In: Walker MA, Ji H, Stent A (eds) Proceedings of the 2018 conference of the North American chapter of the association for computational linguistics: human language technologies, NAACL-HLT 2018, New Orleans, Louisiana, USA, June 1\u20136, 2018, vol 1 (long papers). Association for Computational Linguistics, pp 1206\u20131215. https:\/\/doi.org\/10.18653\/v1\/n18-1109","DOI":"10.18653\/v1\/n18-1109"},{"key":"1854_CR57","doi-asserted-by":"publisher","unstructured":"Zhang M, Zhang Y, Fu G (2019) Cross-lingual dependency parsing using code-mixed treebank. In: Inui K, Jiang J, Ng V, et\u00a0al (eds) Proceedings of the 2019 conference on empirical methods in natural language processing and the 9th international joint conference on natural language processing, EMNLP-IJCNLP 2019, Hong Kong, China, November 3\u20137, 2019. Association for Computational Linguistics, pp 997\u20131006. https:\/\/doi.org\/10.18653\/v1\/D19-1092","DOI":"10.18653\/v1\/D19-1092"},{"key":"1854_CR58","doi-asserted-by":"publisher","unstructured":"Zhao M, Zhu Y, Shareghi E, et\u00a0al (2021) A closer look at few-shot crosslingual transfer: the choice of shots matters. In: Zong C, Xia F, Li W, et\u00a0al (eds) Proceedings of the 59th annual meeting of the association for computational linguistics and the 11th international joint conference on natural language processing, ACL\/IJCNLP 2021, (vol 1: long papers), virtual event, August 1\u20136, 2021. Association for Computational Linguistics, pp 5751\u20135767. 
https:\/\/doi.org\/10.18653\/v1\/2021.acl-long.447","DOI":"10.18653\/v1\/2021.acl-long.447"},{"key":"1854_CR59","doi-asserted-by":"publisher","unstructured":"Zhao W, Eger S, Bjerva J, et\u00a0al (2021) Inducing language-agnostic multilingual representations. In: Nastase V, Vulic I (eds) Proceedings of *SEM 2021: the tenth joint conference on lexical and computational semantics, *SEM 2021, Online, August 5\u20136, 2021. Association for Computational Linguistics, pp 229\u2013240. https:\/\/doi.org\/10.18653\/v1\/2021.starsem-1.22","DOI":"10.18653\/v1\/2021.starsem-1.22"},{"key":"1854_CR60","doi-asserted-by":"publisher","unstructured":"Zheng B, Dong L, Huang S, et\u00a0al (2021) Allocating large vocabulary capacity for cross-lingual language model pre-training. In: Moens M, Huang X, Specia L, et\u00a0al (eds) Proceedings of the 2021 conference on empirical methods in natural language processing, EMNLP 2021, virtual event\/Punta Cana, Dominican Republic, 7\u201311 November, 2021. Association for Computational Linguistics, pp 3203\u20133215. https:\/\/doi.org\/10.18653\/v1\/2021.emnlp-main.257","DOI":"10.18653\/v1\/2021.emnlp-main.257"},{"key":"1854_CR61","doi-asserted-by":"publisher","unstructured":"Zheng S, Song Y, Leung T, et\u00a0al (2016) Improving the robustness of deep neural networks via stability training. In: 2016 IEEE conference on computer vision and pattern recognition, CVPR 2016, Las Vegas, NV, USA, June 27\u201330, 2016. IEEE Computer Society, pp 4480\u20134488. https:\/\/doi.org\/10.1109\/CVPR.2016.485","DOI":"10.1109\/CVPR.2016.485"},{"key":"1854_CR62","unstructured":"Zhu C, Cheng Y, Gan Z, et\u00a0al (2020) FreeLB: enhanced adversarial training for natural language understanding. In: 8th international conference on learning representations, ICLR 2020, Addis Ababa, Ethiopia, April 26\u201330, 2020. 
OpenReview.net, https:\/\/openreview.net\/forum?id=BygzbyHFvB"}],"container-title":["International Journal of Machine Learning and Cybernetics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13042-023-01854-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s13042-023-01854-1\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s13042-023-01854-1.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,22]],"date-time":"2023-08-22T05:29:33Z","timestamp":1692682173000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s13042-023-01854-1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,5,27]]},"references-count":63,"journal-issue":{"issue":"10","published-print":{"date-parts":[[2023,10]]}},"alternative-id":["1854"],"URL":"https:\/\/doi.org\/10.1007\/s13042-023-01854-1","relation":{},"ISSN":["1868-8071","1868-808X"],"issn-type":[{"type":"print","value":"1868-8071"},{"type":"electronic","value":"1868-808X"}],"subject":[],"published":{"date-parts":[[2023,5,27]]},"assertion":[{"value":"6 February 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 May 2023","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"27 May 2023","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}