{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,2]],"date-time":"2025-08-02T14:33:06Z","timestamp":1754145186819,"version":"3.41.2"},"reference-count":84,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2025,1,1]],"date-time":"2025-01-01T00:00:00Z","timestamp":1735689600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2025]]},"DOI":"10.1109\/access.2025.3585679","type":"journal-article","created":{"date-parts":[[2025,7,3]],"date-time":"2025-07-03T13:29:56Z","timestamp":1751549396000},"page":"119197-119214","source":"Crossref","is-referenced-by-count":0,"title":["SMCLM: Semantically Meaningful Causal Language Modeling for Autoregressive Paraphrase Generation"],"prefix":"10.1109","volume":"13","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8646-3345","authenticated-orcid":false,"given":"Michal","family":"Pere\u0142kiewicz","sequence":"first","affiliation":[{"name":"National Information Processing Institute, Warsaw, Poland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"S\u0142awomir","family":"Dadas","sequence":"additional","affiliation":[{"name":"National Information Processing Institute, Warsaw, Poland"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6108-2711","authenticated-orcid":false,"given":"Rafa\u0142","family":"Po\u015bwiata","sequence":"additional","affiliation":[{"name":"National Information Processing Institute, Warsaw, Poland"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2021.3052783"},{"key":"ref2","first-page":"5110","article-title":"From paraphrasing to semantic parsing: Unsupervised semantic parsing via synchronous semantic decoding","volume-title":"Proc. 59th Annu. Meeting Assoc. Comput. Linguistics 11th Int. Joint Conf. Natural Lang. Process.","author":"Wu"},{"key":"ref3","first-page":"1","article-title":"Machine translation within one language as a paraphrasing technique online","volume-title":"Proc. Conf. Theory Pract. Inf. Technol.","author":"Baran\u010d\u00edkov\u00e1"},{"key":"ref4","first-page":"4114","article-title":"Data augmentation with paraphrase generation and entity extraction for multimodal dialogue system","volume-title":"Proc. 13th Lang. Resources Eval. Conf.","author":"Okur"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/AITest55621.2022.00021"},{"key":"ref6","first-page":"5075","article-title":"Paraphrase generation: A survey of the state of the art","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Zhou"},{"issue":"3","key":"ref7","doi-asserted-by":"crossref","first-page":"341","DOI":"10.1162\/coli_a_00002","article-title":"Generating phrasal and sentential paraphrases: A survey of data-driven methods","volume":"36","author":"Madnani","year":"2010","journal-title":"Comput. Linguistics"},{"issue":"1","key":"ref8","first-page":"1","article-title":"Paraphrasing questions using given and new information","volume":"9","author":"McKeown","year":"1983","journal-title":"Amer. J. Comput. Linguistics"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1017\/S1351324901002765"},{"key":"ref10","first-page":"16","article-title":"Learning to paraphrase: An unsupervised approach using multiple-sequence alignment","volume-title":"Proc. Conf. North Amer. Chapter Assoc. Comput. Linguistics Hum. Lang. Technol.-NAACL","volume":"1","author":"Barzilay"},{"key":"ref11","first-page":"177","article-title":"Moses: Open source toolkit for statistical machine translation","volume-title":"Proc. 45th Annu. Meeting Assoc. Comput. Linguistics Companion","author":"Koehn"},{"key":"ref12","first-page":"2923","article-title":"Neural paraphrase generation with stacked residual LSTM networks","volume-title":"Proc. 26th Int. Conf. Comput. Linguistics","author":"Prakash"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v32i1.11956"},{"key":"ref14","first-page":"3609","article-title":"Submodular optimization-based diverse paraphrasing and its effectiveness in data augmentation","volume-title":"Proc. Conf. North Amer. Chapter Assoc. Comput. Linguistics","author":"Kumar"},{"key":"ref15","first-page":"2489","article-title":"Hierarchical sketch induction for paraphrase generation","volume-title":"Proc. 60th Annu. Meeting Assoc. Comput. Linguistics","author":"Hosking"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.eacl-main.88"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N18-1170"},{"key":"ref18","first-page":"238","article-title":"Neural syntactic preordering for controlled paraphrase generation","volume-title":"Proc. 58th Annu. Meeting Assoc. Comput. Linguistics","author":"Goyal"},{"key":"ref19","first-page":"3865","article-title":"Paraphrase generation with deep reinforcement learning","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Li"},{"key":"ref20","first-page":"3130","article-title":"An end-to-end generative architecture for paraphrase generation","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process. 9th Int. Joint Conf. Natural Lang. Process. (EMNLP-IJCNLP)","author":"Yang"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33016834"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.28"},{"key":"ref23","first-page":"7871","article-title":"BART: Denoising sequence-to-sequence pre-training for natural language generation, translation, and comprehension","volume-title":"Proc. 58th Annu. Meeting Assoc. Comput. Linguistics","author":"Lewis"},{"key":"ref24","article-title":"Exploring the limits of transfer learning with a unified text-to-text transformer","author":"Raffel","year":"2023","journal-title":"arXiv:1910.10683"},{"volume-title":"Language Models Are Unsupervised Multitask Learners","year":"2019","author":"Radford","key":"ref25"},{"key":"ref26","first-page":"5136","article-title":"Unsupervised paraphrasing with pretrained language models","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Niu"},{"key":"ref27","first-page":"3294","article-title":"Skip-thought vectors","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"28","author":"Kiros"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/n18-1049"},{"key":"ref29","first-page":"670","article-title":"Supervised learning of universal sentence representations from natural language inference data","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Conneau"},{"key":"ref30","article-title":"Universal sentence encoder","author":"Cer","year":"2018","journal-title":"arXiv: 1803.11175"},{"key":"ref31","first-page":"3982","article-title":"Sentence-BERT: Sentence embeddings using Siamese BERT-networks","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process. 9th Int. Joint Conf. Natural Lang. Process. (EMNLP-IJCNLP)","author":"Reimers"},{"key":"ref32","first-page":"6894","article-title":"SimCSE: Simple contrastive learning of sentence embeddings","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Gao"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.findings-emnlp.59"},{"key":"ref34","article-title":"Towards general text embeddings with multi-stage contrastive learning","author":"Li","year":"2023","journal-title":"arXiv:2308.03281"},{"key":"ref35","article-title":"Text embeddings by weakly-supervised contrastive pre-training","author":"Wang","year":"2022","journal-title":"arXiv:2212.03533"},{"key":"ref36","article-title":"Language-agnostic BERT sentence embedding","author":"Feng","year":"2020","journal-title":"arXiv:2007.01852"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.emnlp-main.365"},{"key":"ref38","article-title":"BGE M3-embedding: Multi-lingual, multi-functionality, multi-granularity text embeddings through self-knowledge distillation","author":"Chen","year":"2024","journal-title":"arXiv:2402.03216"},{"key":"ref39","article-title":"Jina embeddings 2: 8192-token general-purpose text embeddings for long documents","author":"Gunther","year":"2023","journal-title":"arXiv:2310.19923"},{"key":"ref40","article-title":"A comprehensive survey on long context language modeling","author":"Liu","year":"2025","journal-title":"arXiv:2503.17407"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-021-25756-4"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-27779-8_27"},{"key":"ref43","first-page":"455","article-title":"Paraphrasing for automatic evaluation","volume-title":"Proc. Conf. Hum. Lang. Technol. Conf. North Amer. Chapter Assoc. Comput. Linguistics","author":"Kauchak"},{"key":"ref44","first-page":"203","article-title":"Paraphrase generation as monolingual translation: Data and evaluation","volume-title":"Proc. 6th Int. Natural Lang. Gener. Conf.","author":"Wubben"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/K16-1002"},{"key":"ref46","first-page":"3171","article-title":"Exploring diverse expressions for paraphrase generation","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process. 9th Int. Joint Conf. Natural Lang. Process. (EMNLP-IJCNLP)","author":"Qian"},{"key":"ref47","article-title":"Unsupervised contextual paraphrase generation using lexical control and reinforcement learning","author":"Garg","year":"2021","journal-title":"arXiv:2103.12777"},{"key":"ref48","first-page":"2411","article-title":"DivGAN: Towards diverse paraphrase generation via diversified generative adversarial network","volume-title":"Proc. Findings Assoc. Comput. Linguistics, EMNLP","author":"Cao"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D17-1026"},{"key":"ref50","article-title":"Attention is all you need","author":"Vaswani","year":"2017","journal-title":"arXiv:1706.03762"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33017176"},{"key":"ref52","first-page":"6033","article-title":"Unsupervised paraphrasing without translation","volume-title":"Proc. 57th Annu. Meeting Assoc. Comput. Linguistics","author":"Roy"},{"key":"ref53","first-page":"6309","article-title":"Neural discrete representation learning","volume-title":"Proc. 31st Int. Conf. Neural Inf. Process. Syst.","author":"Oord"},{"key":"ref54","first-page":"596","article-title":"Quality controlled paraphrase generation","volume-title":"Proc. 60th Annu. Meeting Assoc. Comput. Linguistics","author":"Bandel"},{"key":"ref55","first-page":"6193","article-title":"ParaMac: A general unsupervised paraphrase generation framework leveraging semantic constraints and diversifying mechanisms","volume-title":"Proc. Findings Assoc. Comput. Linguistics, EMNLP","author":"Liu"},{"issue":"2","key":"ref56","article-title":"Optimization of paraphrase generation and identification using language models in natural language processing","volume":"1","author":"Palivela","year":"2021","journal-title":"Int. J. Inf. Manage. Data Insights"},{"volume-title":"Improving Language Understanding by Generative Pre-Training","year":"2018","author":"Radford","key":"ref57"},{"key":"ref58","first-page":"1877","article-title":"Language models are few-shot learners","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Brown"},{"key":"ref59","first-page":"215","article-title":"Paraphrasing with large language models","volume-title":"Proc. 3rd Workshop Neural Gener. Transl.","author":"Witteveen"},{"key":"ref60","first-page":"1","article-title":"Efficient estimation of word representations in vector space","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Mikolov"},{"key":"ref61","first-page":"1681","article-title":"Deep unordered composition rivals syntactic methods for text classification","volume-title":"Proc. 53rd Annu. Meeting Assoc. Comput. Linguistics 7th Int. Joint Conf. Natural Lang. Process.","author":"Iyyer"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/SMC53654.2022.9945218"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1145\/3593590"},{"key":"ref64","first-page":"2014","article-title":"MTEB: Massive text embedding benchmark","volume-title":"Proc. 17th Conf. Eur. Chapter Assoc. Comput. Linguistics","author":"Muennighoff"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1007\/s10506-024-09408-8"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.findings-emnlp.215"},{"key":"ref67","first-page":"5147","article-title":"Limitations of autoregressive models and their alternatives","volume-title":"Proc. Conf. North Amer. Chapter Assoc. Comput. Linguistics, Hum. Lang. Technol.","author":"Lin"},{"issue":"19","key":"ref68","first-page":"20418","article-title":"Numerical pruning for efficient autoregressive models","volume-title":"Proc. AAAI Conf. Artif. Intell.","volume":"39","author":"Shen"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/TKDE.2021.3090866"},{"issue":"11","key":"ref70","doi-asserted-by":"crossref","first-page":"2451","DOI":"10.3390\/math11112451","article-title":"A mathematical interpretation of autoregressive generative pre-trained transformer and self-supervised learning","volume":"11","author":"Lee","year":"2023","journal-title":"Mathematics"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-10602-1_48"},{"issue":"4","key":"ref72","doi-asserted-by":"crossref","first-page":"664","DOI":"10.1109\/TPAMI.2016.2598339","article-title":"Deep visual-semantic alignments for generating image descriptions","volume":"39","author":"Karpathy","year":"2017","journal-title":"IEEE Trans.Pattern Anal. Mach. Intell."},{"key":"ref73","first-page":"1073","article-title":"Get to the point: Summarization with pointer-generator networks","volume-title":"Proc. 55th Annu. Meeting Assoc. Comput. Linguistics","author":"See"},{"key":"ref74","first-page":"1","article-title":"OPUS-MT\u2014Building open translation services for the world","volume-title":"Proc. 22nd Annu. Conf. Eur. Assoc. Mach. Transl. (EAMT)","author":"Tiedemann"},{"key":"ref75","article-title":"Unsupervised paraphrase generation using pre-trained language models","author":"Hegde","year":"2020","journal-title":"arXiv:2006.05477"},{"key":"ref76","article-title":"Diverse beam search: Decoding diverse solutions from neural sequence models","author":"Vijayakumar","year":"2016","journal-title":"arXiv:1610.02424"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.3115\/1073083.1073135"},{"key":"ref78","first-page":"74","article-title":"ROUGE: A package for automatic evaluation of summaries","volume-title":"Proc. Text Summarization Branches Out","author":"Lin"},{"key":"ref79","first-page":"1925","article-title":"Better summarization evaluation with word embeddings for ROUGE","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Ng"},{"key":"ref80","first-page":"2241","article-title":"Why we need new evaluation metrics for NLG","volume-title":"Proc. Conf. Empirical Methods Natural Lang. Process.","author":"Novikova"},{"key":"ref81","first-page":"119","article-title":"Evaluating question answering evaluation","volume-title":"Proc. 2nd Workshop Mach. Reading Question Answering","author":"Chen"},{"key":"ref82","first-page":"1097","article-title":"Texygen: A benchmarking platform for text generation models","volume-title":"Proc. 41st Int. ACM SIGIR Conf. Res. Develop. Inf. Retr.","author":"Zhu"},{"key":"ref83","first-page":"1","article-title":"BERTScore: Evaluating text generation with BERT","volume-title":"Proc. 8th Int. Conf. Learn. Represent.","author":"Zhang"},{"key":"ref84","first-page":"1631","article-title":"Incorporating copying mechanism in sequence-to-sequence learning","volume-title":"Proc. 54th Annu. Meeting Assoc. Comput. Linguistics","author":"Gu"}],"container-title":["IEEE Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/6287639\/10820123\/11068992.pdf?arnumber=11068992","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,16]],"date-time":"2025-07-16T17:40:13Z","timestamp":1752687613000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11068992\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025]]},"references-count":84,"URL":"https:\/\/doi.org\/10.1109\/access.2025.3585679","relation":{},"ISSN":["2169-3536"],"issn-type":[{"type":"electronic","value":"2169-3536"}],"subject":[],"published":{"date-parts":[[2025]]}}}