{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,10]],"date-time":"2026-02-10T17:48:58Z","timestamp":1770745738997,"version":"3.49.0"},"reference-count":49,"publisher":"Springer Science and Business Media LLC","issue":"30","license":[{"start":{"date-parts":[[2024,2,15]],"date-time":"2024-02-15T00:00:00Z","timestamp":1707955200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,2,15]],"date-time":"2024-02-15T00:00:00Z","timestamp":1707955200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Multimed Tools Appl"],"DOI":"10.1007\/s11042-024-18359-w","type":"journal-article","created":{"date-parts":[[2024,2,15]],"date-time":"2024-02-15T08:02:47Z","timestamp":1707984167000},"page":"74205-74232","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":6,"title":["Identification of paraphrased text in research articles through improved embeddings and fine-tuned BERT model"],"prefix":"10.1007","volume":"83","author":[{"given":"Abdur","family":"Razaq","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3094-3483","authenticated-orcid":false,"given":"Zahid","family":"Halim","sequence":"additional","affiliation":[]},{"given":"Atta","family":"Ur Rahman","sequence":"additional","affiliation":[]},{"given":"Kholla","family":"Sikandar","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,2,15]]},"reference":[{"issue":"6","key":"18359_CR1","doi-asserted-by":"publisher","first-page":"922","DOI":"10.1016\/j.ipm.2018.06.005","volume":"54","author":"B Agarwal","year":"2018","unstructured":"Agarwal B, Ramampiaro H, Langseth H, Ruocco M (2018) A deep network model for paraphrase detection in short text messages. Inf Process Manage 54(6):922\u2013937","journal-title":"Inf Process Manage"},{"issue":"1","key":"18359_CR2","first-page":"1","volume":"18","author":"A Mahmoud","year":"2021","unstructured":"Mahmoud A, Zrigui M (2021) Semantic similarity analysis for corpus development and paraphrase detection in Arabic. Int Arab J Inf Technol 18(1):1\u20137","journal-title":"Int Arab J Inf Technol"},{"key":"18359_CR3","doi-asserted-by":"crossref","unstructured":"Aravinda Reddy D, Anand Kumar M, Soman KP (2019) LSTM based paraphrase identification using combined word embedding features. In Soft computing and signal processing. Springer, Singapore, pp 385-394","DOI":"10.1007\/978-981-13-3393-4_40"},{"key":"18359_CR4","doi-asserted-by":"crossref","unstructured":"Bunk S, Krestel R (2018) WELDA: enhancing topic models by incorporating local word context. In: Proceedings of the 18th ACM\/IEEE on joint conference on digital libraries, pp 293\u2013302","DOI":"10.1145\/3197026.3197043"},{"key":"18359_CR5","first-page":"1","volume-title":"Quora question pairs","author":"Z Chen","year":"2018","unstructured":"Chen Z, Zhang H, Zhang X, Zhao L (2018) Quora question pairs. University of Waterloo, pp 1\u20137"},{"key":"18359_CR6","doi-asserted-by":"publisher","first-page":"425","DOI":"10.1016\/j.eswa.2018.10.017","volume":"118","author":"S Dabiri","year":"2019","unstructured":"Dabiri S, Heaslip K (2019) Developing a Twitter-based traffic event detection model using deep learning architectures. Expert Syst Appl 118:425\u2013439","journal-title":"Expert Syst Appl"},{"key":"18359_CR7","doi-asserted-by":"crossref","unstructured":"Das D, Smith NA (2009) Paraphrase identification as probabilistic quasi-synchronous recognition. In: Proceedings of the joint conference of the 47th annual meeting of the ACL and the 4th international joint conference on natural language processing of the AFNLP. Association for Computational Linguistics, Suntec, pp 468\u2013476","DOI":"10.3115\/1687878.1687944"},{"key":"18359_CR8","unstructured":"Dey K, Shrivastava R, Kaushik S (2016) A paraphrase and semantic similarity detection system for user generated short-text content on microblogs. In: Proceedings of COLING 2016, the 26th international conference on computational linguistics: technical papers, pp 2880\u20132890"},{"issue":"10","key":"18359_CR9","first-page":"3039","volume":"12","author":"V Dogra","year":"2021","unstructured":"Dogra V (2021) Banking news-events representation and classification with a novel hybrid model using DistilBERT and rule-based features. Turk J Comput Math Education (TURCOMAT) 12(10):3039\u20133054","journal-title":"Turk J Comput Math Education (TURCOMAT)"},{"key":"18359_CR10","unstructured":"Dolan B, Brockett C (2005) Automatically constructing a corpus of sentential paraphrases. In: Third international workshop on paraphrasing (IWP2005)"},{"key":"18359_CR11","doi-asserted-by":"crossref","unstructured":"Dolan W, Quirk C, Brockett C, Dolan B (2004) Unsupervised construction of large paraphrase corpora: Exploiting massively parallel news sources. In: COLING 2004: Proceedings of the 20th international conference on computational linguistics, Geneva, pp 350\u2013356","DOI":"10.3115\/1220355.1220406"},{"key":"18359_CR12","doi-asserted-by":"crossref","unstructured":"Eyecioglu A, Keller B (2015) Twitter paraphrase identification with simple overlap features and SVMs. In: Proceedings of the 9th international workshop on semantic evaluation (SemEval 2015), pp 64\u201369","DOI":"10.18653\/v1\/S15-2011"},{"key":"18359_CR13","doi-asserted-by":"crossref","unstructured":"Felbo B, Mislove A, S\u00f8gaard A, Rahwan I, Lehmann S (2017) Using millions of emoji occurrences to learn any-domain representations for detecting sentiment, emotion, and sarcasm. arXiv preprint  arXiv:1708.00524","DOI":"10.18653\/v1\/D17-1169"},{"key":"18359_CR14","doi-asserted-by":"publisher","first-page":"59","DOI":"10.1016\/j.csl.2017.07.002","volume":"47","author":"R Ferreira","year":"2018","unstructured":"Ferreira R, Cavalcanti GD, Freitas F, Lins RD, Simske SJ, Riss M (2018) Combining sentence similarities measures to identify paraphrases. Comput Speech Lang 47:59\u201373","journal-title":"Comput Speech Lang"},{"key":"18359_CR15","unstructured":"Heilman M, Smith NA (2010) Tree edit models for recognizing textual entailments, paraphrases, and answers to questions. In: Human language technologies: The 2010 annual conference of the north American chapter of the association for computational linguistics, pp 1011\u20131019"},{"key":"18359_CR16","unstructured":"Hu B, Lu Z, Li H, Chen Q (2014) Convolutional neural network architectures for matching natural language sentences. Adv Neural Inform Process Syst p 27"},{"key":"18359_CR17","unstructured":"Ji Y, Eisenstein J (2013) Discriminative improvements to distributional sentence similarity. In: Proceedings of the 2013 conference on empirical methods in natural language processing, pp 891\u2013896"},{"key":"18359_CR18","doi-asserted-by":"crossref","unstructured":"Jinesh YI, Gawade S, Palivela H (2022) \"Feature Extraction from Radiology Images for Visual Question Answering System Using CNN and BiLSTM Model.\" Recent Innovations in Computing. Springer, Singapore, pp 317\u2013331","DOI":"10.1007\/978-981-16-8248-3_26"},{"key":"18359_CR19","doi-asserted-by":"crossref","unstructured":"Karan M, Glava\u0161 G, \u0160najder J, Dalbelo Ba\u0161i\u0107 B, Vulic I, Moens MF (2015) Tklbliir: Detecting Twitter paraphrases with tweeting Jay. In Proceedings of the 9th International Workshop on Semantic Evaluation (SemEval 2015) (pp. 70\u201374). ACL; East Stroudsburg, PA","DOI":"10.18653\/v1\/S15-2012"},{"key":"18359_CR20","doi-asserted-by":"publisher","first-page":"116677","DOI":"10.1016\/j.eswa.2022.116677","volume":"197","author":"K Yalcin","year":"2022","unstructured":"Yalcin K, Cicekli I, Ercan G (2022) An external plagiarism detection system based on part-of-speech (POS) tag n-grams and word embedding. Expert Syst Appl 197:116677","journal-title":"Expert Syst Appl"},{"key":"18359_CR21","unstructured":"Lan W, Xu W (2018) Neural network models for paraphrase identification, semantic textual similarity, natural language inference, and question answering. In: Proceedings of the 27th international conference on computational linguistics, pp 3890\u20133902"},{"key":"18359_CR22","doi-asserted-by":"publisher","first-page":"2835023","DOI":"10.1155\/2020\/2835023","volume":"2020","author":"W Lian","year":"2020","unstructured":"Lian W, Nie G, Jia B, Shi D, Fan Q, Liang Y (2020) An intrusion detection method based on decision tree-recursive feature elimination in ensemble learning. Math Probl Eng 2020:2835023","journal-title":"Math Probl Eng"},{"issue":"1","key":"18359_CR23","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/s13638-017-0993-1","volume":"2017","author":"H Liang","year":"2017","unstructured":"Liang H, Sun X, Sun Y, Gao Y (2017) Text feature extraction based on deep learning: a review. EURASIP J Wirel Commun Netw 2017(1):1\u201312","journal-title":"EURASIP J Wirel Commun Netw"},{"key":"18359_CR24","unstructured":"Madnani N, Tetreault J, Chodorow M (2012) Re-examining machine translation metrics for paraphrase identification. In: Proceedings of the 2012 conference of the North American chapter of the Association for Computational Linguistics: human language technologies, pp 182\u2013190"},{"issue":"3","key":"18359_CR25","doi-asserted-by":"publisher","first-page":"640","DOI":"10.1016\/j.ipm.2017.01.002","volume":"53","author":"AS Mohammad","year":"2017","unstructured":"Mohammad AS, Jaradat Z, Mahmoud AA, Jararweh Y (2017) Paraphrase identification and semantic text similarity analysis in Arabic news tweets using lexical, syntactic, and semantic features. Inf Process Manage 53(3):640\u2013652","journal-title":"Inf Process Manage"},{"key":"18359_CR26","unstructured":"Ngoc Phuoc An V, Magnolini S, Popescu O (2015) Paraphrase identification and semantic similarity in twitter with simple features. In: The 3rd international workshop on natural language processing for social media, pp 10\u201319"},{"key":"18359_CR27","doi-asserted-by":"crossref","unstructured":"Nighojkar A, Licato J (2021) Improving paraphrase detection with the adversarial paraphrasing task. In Proceedings of the 59th annual meeting of the association for computational linguistics and the 11th international joint conference on natural language processing, (Volume 1: Long papers), pp 7106\u20137116","DOI":"10.18653\/v1\/2021.acl-long.552"},{"issue":"4","key":"18359_CR28","doi-asserted-by":"publisher","first-page":"390","DOI":"10.1016\/j.datak.2011.01.002","volume":"70","author":"J Oliva","year":"2011","unstructured":"Oliva J, Serrano JI, Del Castillo MD, Iglesias \u00c1 (2011) SyMSS: A syntax-based measure for short-text semantic similarity. Data Knowl Eng 70(4):390\u2013405","journal-title":"Data Knowl Eng"},{"key":"18359_CR29","doi-asserted-by":"publisher","DOI":"10.3115\/1073445.1073469","volume-title":"Syntax-based alignment of multiple translations: extracting paraphrases and generating new sentences","author":"B Pang","year":"2003","unstructured":"Pang B, Knight K, Marcu D (2003) Syntax-based alignment of multiple translations: extracting paraphrases and generating new sentences. Cornell University Ithaca NY, Department Computer Science"},{"key":"18359_CR30","doi-asserted-by":"crossref","unstructured":"Pennington J, Socher R, Manning CD (2014) Glove: Global vectors for word representation. In: Proceedings of the 2014 conference on empirical methods in natural language processing (EMNLP), pp 1532\u20131543","DOI":"10.3115\/v1\/D14-1162"},{"key":"18359_CR31","doi-asserted-by":"crossref","unstructured":"Peng Q, Weir D, Weeds J, Chai Y (2022) Predicate-argument based bi-encoder for paraphrase identification. In: Proceedings of the 60th annual meeting of the association for computational linguistics (volume 1: long papers), pp 5579\u20135589","DOI":"10.18653\/v1\/2022.acl-long.382"},{"issue":"6","key":"18359_CR32","doi-asserted-by":"publisher","first-page":"102060","DOI":"10.1016\/j.ipm.2019.102060","volume":"56","author":"J Rashid","year":"2019","unstructured":"Rashid J, Shah SMA, Irtaza A (2019) Fuzzy topic modeling approach for text mining over short text. Inf Process Manage 56(6):102060","journal-title":"Inf Process Manage"},{"key":"18359_CR33","doi-asserted-by":"crossref","unstructured":"Jain R, Kathuria A, Singh A, Saxena A, Khandelwal A (2022) ParaCap: paraphrase detection model using capsule network. Multimed Syst pp 1\u201319","DOI":"10.1007\/s00530-020-00746-6"},{"key":"18359_CR34","doi-asserted-by":"crossref","unstructured":"Chawla S, Aggarwal P, Kaur R (2022) Comparative analysis of semantic similarity word embedding techniques for paraphrase detection. In: Emerging technologies for computing, communication, and smart cities: Proceedings of ETCCS 2021, Springer, pp 15\u201329","DOI":"10.1007\/978-981-19-0284-0_2"},{"key":"18359_CR35","doi-asserted-by":"crossref","unstructured":"Reimers N, Gurevych I (2017) Reporting score distributions makes a difference: Performance study of lstm-networks for sequence tagging. arXiv preprint  arXiv:1707.09861","DOI":"10.18653\/v1\/D17-1035"},{"key":"18359_CR36","unstructured":"Rus V, McCarthy PM, Lintean MC, McNamara DS, Graesser AC (2008). Paraphrase Identification with Lexico-Syntactic Graph Subsumption. In FLAIRS Conference, pp 201\u2013206"},{"issue":"4","key":"18359_CR37","doi-asserted-by":"publisher","first-page":"6479","DOI":"10.1007\/s11042-020-09996-y","volume":"80","author":"H Shahmohammadi","year":"2021","unstructured":"Shahmohammadi H, Dezfoulian M, Mansoorizadeh M (2021) Paraphrase detection using LSTM networks and handcrafted features. Multimed Tools Appl 80(4):6479\u20136492","journal-title":"Multimed Tools Appl"},{"issue":"3","key":"18359_CR38","doi-asserted-by":"publisher","first-page":"102204","DOI":"10.1016\/j.ipm.2020.102204","volume":"57","author":"MH Shakeel","year":"2020","unstructured":"Shakeel MH, Karim A, Khan I (2020) A multi-cascaded model with data augmentation for enhanced paraphrase detection in short texts. Inf Process Manage 57(3):102204","journal-title":"Inf Process Manage"},{"key":"18359_CR39","unstructured":"Socher R, Huang E, Pennin J, Manning CD, Ng A (2011) Dynamic pooling and unfolding recursive autoencoders for paraphrase detection. Adv Neural Inform Process Syst p 24"},{"key":"18359_CR40","doi-asserted-by":"crossref","unstructured":"Wang Z, Hamza W, Florian R (2017) Bilateral multi-perspective matching for natural language sentences. arXiv preprint  arXiv:1702.03814","DOI":"10.24963\/ijcai.2017\/579"},{"key":"18359_CR41","unstructured":"Wang Z, Mi H, Ittycheriah A (2016) Sentence similarity learning by lexical decomposition and composition. In: Proceedings of COLING 2016, the 26th international conference on computational linguistics: Technical papers, pp 1340\u20131349"},{"issue":"1","key":"18359_CR42","doi-asserted-by":"publisher","first-page":"103154","DOI":"10.1016\/j.ipm.2022.103154","volume":"60","author":"X Xie","year":"2023","unstructured":"Xie X, Li Z, Tang Z, Yao D, Ma H (2023) Unifying knowledge iterative dissemination and relational reconstruction network for image\u2013text matching. Inf Process Manage 60(1):103154","journal-title":"Inf Process Manage"},{"key":"18359_CR43","doi-asserted-by":"crossref","unstructured":"Xu W, Callison-Burch C, Dolan WB (2015) Semeval-2015 task 1: Paraphrase and semantic similarity in Twitter (pit). In: Proceedings of the 9th International Workshop on semantic evaluation (SemEval 2015), pp 1\u201311","DOI":"10.18653\/v1\/S15-2001"},{"key":"18359_CR44","doi-asserted-by":"publisher","first-page":"435","DOI":"10.1162\/tacl_a_00194","volume":"2","author":"W Xu","year":"2014","unstructured":"Xu W, Ritter A, Callison-Burch C, Dolan WB, Ji Y (2014) Extracting lexically divergent paraphrases from Twitter. Trans Assoc Comput Linguis 2:435\u2013448","journal-title":"Trans Assoc Comput Linguis"},{"issue":"2","key":"18359_CR45","doi-asserted-by":"publisher","first-page":"103186","DOI":"10.1016\/j.ipm.2022.103186","volume":"60","author":"M Yang","year":"2023","unstructured":"Yang M, Chen X, Tan L, Lan X, Luo Y (2023) Listen carefully to experts when you classify data: A generic data classification ontology encoded from regulations. Inf Process Manage 60(2):103186","journal-title":"Inf Process Manage"},{"key":"18359_CR46","doi-asserted-by":"crossref","unstructured":"Yin W, Sch\u00fctze H (2015) Convolutional neural network for paraphrase identification. In: Proceedings of the 2015 conference of the north American chapter of the association for computational linguistics: human language technologies, pp 901\u2013911","DOI":"10.3115\/v1\/N15-1091"},{"key":"18359_CR47","doi-asserted-by":"crossref","unstructured":"Zarrella G, Henderson J, Merkhofer E, Strickhart L (2015) Mitre: Seven systems for semantic similarity in tweets. In: Proceedings of the 9th international workshop on semantic evaluation (SemEval 2015), pp 12\u201317","DOI":"10.18653\/v1\/S15-2002"},{"key":"18359_CR48","doi-asserted-by":"crossref","unstructured":"Zhao J, Lan M (2015) Ecnu: Leveraging word embeddings to boost performance for paraphrase on Twitter. In: Proceedings of the 9th international workshop on semantic evaluation (SemEval 2015), pp 34\u201339","DOI":"10.18653\/v1\/S15-2006"},{"key":"18359_CR49","doi-asserted-by":"crossref","unstructured":"Palivela H (2021) Optimization of paraphrase generation and identification using language models in natural language processing. Int J Inf Manag Data Insights\u00a01(2):100025","DOI":"10.1016\/j.jjimei.2021.100025"}],"container-title":["Multimedia Tools and Applications"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-18359-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11042-024-18359-w\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11042-024-18359-w.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,9,3]],"date-time":"2024-09-03T02:17:50Z","timestamp":1725329870000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11042-024-18359-w"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,2,15]]},"references-count":49,"journal-issue":{"issue":"30","published-online":{"date-parts":[[2024,9]]}},"alternative-id":["18359"],"URL":"https:\/\/doi.org\/10.1007\/s11042-024-18359-w","relation":{},"ISSN":["1573-7721"],"issn-type":[{"value":"1573-7721","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,2,15]]},"assertion":[{"value":"10 February 2023","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"21 October 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"19 January 2024","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 February 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"All procedures performed in studies involving human participants were per the ethical standards of the institutional and\/or national research committee and with the 1964 Helsinki Declaration and its later amendments or comparable ethical standards.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Ethical approval"}},{"value":"N\/A.","order":3,"name":"Ethics","group":{"name":"EthicsHeading","label":"Informed consent"}},{"value":"All authors declare that they have no conflict of interest.","order":4,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}