{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,17]],"date-time":"2025-10-17T14:12:36Z","timestamp":1760710356994},"reference-count":31,"publisher":"Springer Science and Business Media LLC","issue":"4","license":[{"start":{"date-parts":[[2020,9,16]],"date-time":"2020-09-16T00:00:00Z","timestamp":1600214400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2020,9,16]],"date-time":"2020-09-16T00:00:00Z","timestamp":1600214400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Speech Technol"],"published-print":{"date-parts":[[2020,12]]},"DOI":"10.1007\/s10772-020-09753-4","type":"journal-article","created":{"date-parts":[[2020,9,16]],"date-time":"2020-09-16T09:03:54Z","timestamp":1600247034000},"page":"851-859","update-policy":"http:\/\/dx.doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":12,"title":["Factors affecting sentence similarity and paraphrasing identification"],"prefix":"10.1007","volume":"23","author":[{"given":"Marwah","family":"Alian","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Arafat","family":"Awajan","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2020,9,16]]},"reference":[{"key":"9753_CR1","doi-asserted-by":"publisher","first-page":"42740","DOI":"10.1109\/ACCESS.2018.2852648","volume":"6","author":"M Alhawarat","year":"2018","unstructured":"Alhawarat, M., & Hegazi, M. (2018). Revisiting KMeans and topic modeling, a comparison study to cluster arabic documents. IEEE Access, 6, 42740\u201342749.","journal-title":"IEEE Access"},{"key":"9753_CR31","unstructured":"Alian, M., & Awajan, A. (2020). Evaluating Factors affecting sentences similarity and paraphrasing identification using K-means clustering. In The 35th International Business Information Management Association (35th IBIMA) (pp. 952\u2013959)."},{"key":"9753_CR2","doi-asserted-by":"crossref","unstructured":"Alian, M., & Awajan, A. (2018). Semantic similarity approaches\u2014Review. In 2018 international arab conference on information technology (ACIT2018), Werdanye, Lebanon (pp. 1\u20136).","DOI":"10.1109\/ACIT.2018.8672665"},{"key":"9753_CR3","doi-asserted-by":"crossref","unstructured":"Alian, M., Awajan, A., Al-Hasan, A., & Akuzhia, R. (2019). Towards building Arabic paraphrasing benchmark. In The second international conference on data science, E-learning and information systems (DATA\u2019 2019), Dubai.","DOI":"10.1145\/3368691.3368708"},{"key":"9753_CR4","unstructured":"Alkholi, M. A. (2001). Semantics-\u00a0Elm AldlAlAh (Elm AlmEnY)(Vol.\u00a01). Amman: dar Al-falah."},{"key":"9753_CR5","unstructured":"Al-Kholi, M. A. (1999).\u00a0Transformation rules for Arabic language. Jordan: dar Al-Falah."},{"issue":"2","key":"9753_CR6","doi-asserted-by":"publisher","first-page":"5","DOI":"10.5120\/8012-0675","volume":"51","author":"M Alkoffash","year":"2012","unstructured":"Alkoffash, M. (2012). Automatic arabic text clustering using K-means and K-mediods. International Journal of Computer Applications, 51(2), 5\u20138.","journal-title":"International Journal of Computer Applications"},{"key":"9753_CR7","unstructured":"Awajan, M., & Alian, A. (2020). Paraphrasing identification techniques in English and Arabic texts. In The 11th international conference on information and communication systems, Irbid, Jordan (pp. 155\u2013160)."},{"key":"9753_CR8","doi-asserted-by":"publisher","first-page":"135","DOI":"10.1162\/tacl_a_00051","volume":"5","author":"P Bojanowski","year":"2017","unstructured":"Bojanowski, P., Grave, E., Joulin, A., & Mikolov, T. (2017). Enriching word vectors with subword information. Transactions of the Association for Computational Linguistics, 5, 135\u2013146.","journal-title":"Transactions of the Association for Computational Linguistics"},{"key":"9753_CR9","doi-asserted-by":"crossref","unstructured":"Bsoul, Q. W., & Mohd, M. (2011). Effect of ISRI stemming on similarity measure for arabic document clustering. In Asia information retrieval symposium (pp. 584\u2013593).","DOI":"10.1007\/978-3-642-25631-8_53"},{"key":"9753_CR10","doi-asserted-by":"publisher","DOI":"10.1515\/9783112316009","volume-title":"Syntactic structure","author":"N Chomsky","year":"1957","unstructured":"Chomsky, N. (1957). Syntactic structure. Paris: Mouton Publishers."},{"key":"9753_CR11","unstructured":"Fernando, S., & Stevenson, M. (2008). A semantic similarity approach to paraphrase detection. In The 11th annual research colloquium of the UK special interest group for computational linguistics."},{"key":"9753_CR12","doi-asserted-by":"crossref","unstructured":"Froud, H., & Lachkar, A. (2013). Agglomerative hierarchical clustering techniques for arabic documents. In Advances in computational science, engineering and information technology. Advances in intelligent systems and computing (Vol. 225). Heidelberg: Springer.","DOI":"10.1007\/978-3-319-00951-3_25"},{"key":"9753_CR13","unstructured":"Grave, E., Bojanowski, P., Gupta, P., Joulin, A., & Mikolov, T. (2018). Learning word vectors for 157 languages. In Proceedings of the international conference on language resources and evaluation (LREC 2018)."},{"key":"9753_CR14","unstructured":"Hussein, M., Alsammak, A., & Elshishtawy, T. (2016) In The 10th international conference on informatics and systems (pp. 61\u201367)."},{"issue":"3","key":"9753_CR15","doi-asserted-by":"publisher","first-page":"640","DOI":"10.1016\/j.ipm.2017.01.002","volume":"53","author":"M Jaradat","year":"2017","unstructured":"Jaradat, M., Al-Ayyoub, Z., Jararweh, M., & Al-Smadi, Y. (2017). Paraphrase identification and semantic text similarity analysis in Arabic news tweets using lexical, syntactic, and semantic features. Information Processing and Management, 53(3), 640\u2013652.","journal-title":"Information Processing and Management"},{"key":"9753_CR16","unstructured":"Jarim, A., & Ali, M. (2004). Clear Syntax for Arabic Grammar (AlnHw AlwADH fy qwAEd AllgAh AlErbyAh) (2nd ed.). Riyadh: Egyptian and Saudi dar for Publishing."},{"key":"9753_CR17","volume-title":"Artificial intelligence with python","author":"P Joshi","year":"2017","unstructured":"Joshi, P. (2017). Artificial intelligence with python. Birmingham, UK: Packt Publishing Ltd."},{"key":"9753_CR18","unstructured":"Klavans, J., Eskin, E., & Hatzivassiloglou, V. (1999). Detecting text similarity over short passages: Exploring linguistic feature combinations via machine learning. In SIGDAT conference: empirical methods in NLP and very large corpora (pp. 204\u2013212)."},{"key":"9753_CR19","unstructured":"Lintean, C. M., & Rus, V. (2012). Measuring semantic similarity in short texts through greedy pairing and word semantics. In The twenty-fifth international florida artificial intelligence research society conference (pp. 244\u2013249)."},{"issue":"2","key":"9753_CR20","first-page":"208","volume":"10","author":"EL Lydia","year":"2018","unstructured":"Lydia, E. L., Govindaswamy, P., Lakshmanaprabu, S., & Ramya, D. (2018). Document clustering based on text mining K-means algorithm using euclidean distance similarity. Journal of Advanced Research in Dynamical and Control Systems, 10(2), 208\u2013214.","journal-title":"Journal of Advanced Research in Dynamical and Control Systems"},{"key":"9753_CR21","doi-asserted-by":"publisher","first-page":"256","DOI":"10.1016\/j.procs.2017.10.117","volume":"117","author":"ABS Mohammad","year":"2017","unstructured":"Mohammad, A. B. S., Eissa, K., & El-Beltagy, S. R. (2017). AraVec: A set of arabic word embedding models for use in arabic NLP. Procedia Computer Science, 117, 256\u2013265.","journal-title":"Procedia Computer Science"},{"key":"9753_CR22","doi-asserted-by":"crossref","unstructured":"Mohsen, G., Al-Ayyoub, M., Hmeidi, I., & Al-Aiad, A. (2018). On the automatic construction of an arabic thesaurus. In 9th international conference on information and communication systems (ICICS).","DOI":"10.1109\/IACS.2018.8355431"},{"issue":"31","key":"9753_CR23","doi-asserted-by":"publisher","first-page":"975","DOI":"10.5120\/ijca2018918234","volume":"182","author":"S Naeem","year":"2018","unstructured":"Naeem, S., & Wumaier, A. (2018). Study and implementing K-mean clustering algorithm on english text and techniques to find the optimal value of K. International Journal of Computer Applications, 182(31), 975\u20138887.","journal-title":"International Journal of Computer Applications"},{"key":"9753_CR24","doi-asserted-by":"crossref","unstructured":"Nagoudi, E. M. B., Ferrero, J., & Schwab, D. (2017). LIM-LIG at SemEval-2017 task1: Enhancing the semantic similarity for arabic sentences with vectors weighting. In 11th international workshop semantic evaluation (SemEval 2017) (pp. 134\u2013138).","DOI":"10.18653\/v1\/S17-2017"},{"key":"9753_CR25","unstructured":"Omar, A. M. (1420\u20131999).\u00a0Language excercises and grammar (Vol. 2). Kuwait: Kuwait University."},{"key":"9753_CR26","volume-title":"\u0639\u0644\u0645 \u0627\u0644\u062f\u0644\u0627\u0644\u0629 semantics -Elm AldlAlAh","author":"AM Omar","year":"1998","unstructured":"Omar, A. M. (1998).\u00a0Semantics -Elm AldlAlAh (5th ed.). Cairo, Egypt: Book World.","edition":"5"},{"key":"9753_CR27","unstructured":"Oshea, F. A., Bandar, J. D., Crockett, Z., & Almarsoomi, K. (2013). AWSS: An algorithm for measuring arabic word semantic similarity. In 2013 IEEE international conference on systems, man, and cybernetics (pp. 504\u2013509)."},{"key":"9753_CR28","unstructured":"Rahaman, I., & Hosein, P. (2017). Exploiting Gaussian word embeddings for document clustering. In Future technologies conference (FTC) (pp. 1015\u20131018)."},{"issue":"21","key":"9753_CR29","first-page":"2497","volume":"97","author":"HRH Soliman","year":"2019","unstructured":"Soliman, H. R. H., Grida, M., & Hassan, M. (2019). Arabic text custering based on K-means algorithm with semantic word embedding. Journal of Theoretical and Applied Information Technology, 97(21), 2497\u20132509.","journal-title":"Journal of Theoretical and Applied Information Technology"},{"issue":"9","key":"9753_CR30","doi-asserted-by":"publisher","first-page":"0975","DOI":"10.5120\/ijca2017913757","volume":"163","author":"S Srivastava","year":"2017","unstructured":"Srivastava, S., & Govilkar, S. (2017). A survey on paraphrase detection techniques for Indian regional languages. International Journal of Computer Applications, 163(9), 0975\u20138887.","journal-title":"International Journal of Computer Applications"}],"container-title":["International Journal of Speech Technology"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-020-09753-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s10772-020-09753-4\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s10772-020-09753-4.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2021,9,16]],"date-time":"2021-09-16T00:11:19Z","timestamp":1631751079000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s10772-020-09753-4"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,9,16]]},"references-count":31,"journal-issue":{"issue":"4","published-print":{"date-parts":[[2020,12]]}},"alternative-id":["9753"],"URL":"https:\/\/doi.org\/10.1007\/s10772-020-09753-4","relation":{},"ISSN":["1381-2416","1572-8110"],"issn-type":[{"value":"1381-2416","type":"print"},{"value":"1572-8110","type":"electronic"}],"subject":[],"published":{"date-parts":[[2020,9,16]]},"assertion":[{"value":"24 February 2020","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"3 September 2020","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"16 September 2020","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}