{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,31]],"date-time":"2026-03-31T09:05:30Z","timestamp":1774947930135,"version":"3.50.1"},"reference-count":42,"publisher":"Springer Science and Business Media LLC","issue":"12","license":[{"start":{"date-parts":[[2022,4,28]],"date-time":"2022-04-28T00:00:00Z","timestamp":1651104000000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,4,28]],"date-time":"2022-04-28T00:00:00Z","timestamp":1651104000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Scientometrics"],"published-print":{"date-parts":[[2022,12]]},"DOI":"10.1007\/s11192-022-04380-z","type":"journal-article","created":{"date-parts":[[2022,4,28]],"date-time":"2022-04-28T05:02:48Z","timestamp":1651122168000},"page":"7061-7075","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":11,"title":["Constructing a high-quality dataset for automated creation of summaries of fundamental contributions of research articles"],"prefix":"10.1007","volume":"127","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7088-9752","authenticated-orcid":false,"given":"Haihua","family":"Chen","sequence":"first","affiliation":[]},{"given":"Huyen","family":"Nguyen","sequence":"additional","affiliation":[]},{"given":"Asmaa","family":"Alghamdi","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2022,4,28]]},"reference":[{"key":"4380_CR1","first-page":"5","volume":"2012","author":"M Angrosh","year":"2012","unstructured":"Angrosh, M., Cranefield, S., & Stanger, N. (2012). A citation centric annotation scheme for scientific articles. Proceedings of the Australasian Language Technology Association Workshop, 2012, 5\u201314.","journal-title":"Proceedings of the Australasian Language Technology Association Workshop"},{"key":"4380_CR2","doi-asserted-by":"crossref","unstructured":"Auer, S., Kovtun, V., Prinz, M., Kasprzik, A., Stocker, M., & Vidal, M. E. (2018). Towards a knowledge graph for science. In Proceedings of the 8th International Conference on Web Intelligence, Mining and Semantics, (pp 1\u20136).","DOI":"10.1145\/3227609.3227689"},{"key":"4380_CR3","doi-asserted-by":"crossref","unstructured":"Beltagy, I., Lo, K., & Cohan, A. (2019). Scibert: A pretrained language model for scientific text. arXiv preprint arXiv:1903.10676.","DOI":"10.18653\/v1\/D19-1371"},{"issue":"2","key":"4380_CR4","first-page":"249","volume":"22","author":"J Carletta","year":"1996","unstructured":"Carletta, J. (1996). Assessing agreement on classification tasks: The kappa statistic. Computational Linguistics, 22(2), 249\u2013254.","journal-title":"Computational Linguistics"},{"key":"4380_CR5","doi-asserted-by":"crossref","unstructured":"Chakravarthi, B.R. (2021). Domain identification of scientific articles using transfer learning and ensembles. In Trends and Applications in Knowledge Discovery and Data Mining: PAKDD 2021 Workshops, WSPA, MLMEIN, SDPRA, DARAI, and AI4EPT, Delhi, India, May 11, 2021 Proceedings, (vol 12705, p. 88). Springer Nature.","DOI":"10.1007\/978-3-030-75015-2_9"},{"key":"4380_CR6","doi-asserted-by":"publisher","first-page":"321","DOI":"10.1613\/jair.953","volume":"16","author":"NV Chawla","year":"2002","unstructured":"Chawla, N. V., Bowyer, K. W., Hall, L. O., & Kegelmeyer, W. P. (2002). Smote: synthetic minority over-sampling technique. Journal of artificial intelligence research, 16, 321\u2013357.","journal-title":"Journal of artificial intelligence research"},{"key":"4380_CR7","unstructured":"Chen, H., & Kanuboddu, B. N. (2021). A fine-grained annotation scheme for research contribution in academic literature. In Proceedings of the 18th International Conference on Scientometrics and Informetrics, (pp 241\u2013248)."},{"issue":"2","key":"4380_CR8","doi-asserted-by":"publisher","first-page":"831","DOI":"10.1109\/TR.2021.3070863","volume":"70","author":"H Chen","year":"2021","unstructured":"Chen, H., Chen, J., & Ding, J. (2021). Data evaluation and enhancement for quality improvement of machine learning. IEEE Transactions on Reliability, 70(2), 831\u2013847.","journal-title":"IEEE Transactions on Reliability"},{"issue":"2","key":"4380_CR9","doi-asserted-by":"publisher","first-page":"102798","DOI":"10.1016\/j.ipm.2021.102798","volume":"59","author":"H Chen","year":"2022","unstructured":"Chen, H., Wu, L., Chen, J., Lu, W., & Ding, J. (2022). A comparative study of automated legal text classification using random forests and deep learning. Information Processing & Management, 59(2), 102798.","journal-title":"Information Processing & Management"},{"issue":"2","key":"4380_CR10","first-page":"16","volume":"4","author":"RA Day","year":"1989","unstructured":"Day, R. A., et al. (1989). The origins of the scientific paper: the imrad format. Journal of the American Medical Directors Association, 4(2), 16\u201318.","journal-title":"Journal of the American Medical Directors Association"},{"key":"4380_CR11","unstructured":"D\u2019Souza, J., & Auer, S. (2020). Nlpcontributions: An annotation scheme for machine reading of scholarly contributions in natural language processing literature. In EEKE@JCDL\u201920 - Workshop on Extraction and Evaluation of Knowledge Entities from Scientific Documents."},{"issue":"2","key":"4380_CR12","doi-asserted-by":"publisher","first-page":"463","DOI":"10.1007\/s11135-014-0003-1","volume":"49","author":"R Falotico","year":"2015","unstructured":"Falotico, R., & Quatto, P. (2015). Fleiss\u2019 kappa statistic without paradoxes. Quality & Quantity, 49(2), 463\u2013470.","journal-title":"Quality & Quantity"},{"issue":"1","key":"4380_CR13","first-page":"3133","volume":"15","author":"M Fern\u00e1ndez-Delgado","year":"2014","unstructured":"Fern\u00e1ndez-Delgado, M., Cernadas, E., Barro, S., & Amorim, D. (2014). Do we need hundreds of classifiers to solve real world classification problems? The Journal of Machine Learning Research, 15(1), 3133\u20133181.","journal-title":"The Journal of Machine Learning Research"},{"key":"4380_CR14","unstructured":"Fisas B, Ronzano F, Saggion H (2016) A multi-layered annotated corpus of scientific papers. In Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC\u201916), (pp. 3081\u20133088)."},{"key":"4380_CR15","first-page":"261","volume":"2020","author":"W Hao","year":"2020","unstructured":"Hao, W., Li, Z., Qian, Y., Wang, Y., & Zhang, C. (2020). The acl fws-rc: A dataset for recognition and classification of sentence about future works. Proceedings of the ACM\/IEEE Joint Conference on Digital Libraries in, 2020, 261\u2013269.","journal-title":"Proceedings of the ACM\/IEEE Joint Conference on Digital Libraries in"},{"key":"4380_CR16","volume-title":"Scientific writing and communication: papers, proposals, and presentations","author":"AH Hofmann","year":"2016","unstructured":"Hofmann, A. H. (2016). Scientific writing and communication: papers, proposals, and presentations (3rd ed.). Oxford, United Kingdom: Oxford University Press.","edition":"3"},{"issue":"1","key":"4380_CR17","first-page":"13","volume":"22","author":"E Hovy","year":"2010","unstructured":"Hovy, E., & Lavid, J. (2010). Towards a \u2018science\u2019of corpus annotation: a new methodological challenge for corpus linguistics. International Journal of Translation, 22(1), 13\u201336.","journal-title":"International Journal of Translation"},{"key":"4380_CR18","doi-asserted-by":"crossref","unstructured":"Jaradeh, M.Y., Oelen, A., Farfar, K.E., Prinz, M., D\u2019Souza, J., Kismih\u00f3k, G., Stocker, M., & Auer, S. (2019). Open research knowledge graph: Next generation infrastructure for semantic scholarly knowledge. In Proceedings of the 10th International Conference on Knowledge Capture, ACM, (pp. 243-246), https:\/\/dl.acm.org\/doi\/10.1145\/3360901.3364435.","DOI":"10.1145\/3360901.3364435"},{"issue":"1","key":"4380_CR19","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1186\/1478-4505-10-21","volume":"10","author":"MO Kok","year":"2012","unstructured":"Kok, M. O., & Schuit, A. J. (2012). Contribution mapping: A method for mapping the contribution of research to enhance its impact. Health Research Policy and Systems, 10(1), 1\u201316.","journal-title":"Health Research Policy and Systems"},{"issue":"4","key":"4380_CR20","doi-asserted-by":"publisher","first-page":"150","DOI":"10.3390\/info10040150","volume":"10","author":"K Kowsari","year":"2019","unstructured":"Kowsari, K., Jafari Meimandi, K., Heidarysafa, M., Mendu, S., Barnes, L., & Brown, D. (2019). Text classification algorithms: A survey. Information, 10(4), 150.","journal-title":"Information"},{"issue":"4","key":"4380_CR21","doi-asserted-by":"publisher","first-page":"26","DOI":"10.2478\/jdis-2019-0019","volume":"4","author":"X Le","year":"2019","unstructured":"Le, X., Chu, J., Deng, S., Jiao, Q., Pei, J., Zhu, L., & Yao, J. (2019). Citeopinion: Evidence-based evaluation tool for academic contributions of research papers based on citing sentences. Journal of Data and Information Science, 4(4), 26\u201341.","journal-title":"Journal of Data and Information Science"},{"key":"4380_CR22","unstructured":"Li, Q., Peng, H., Li, J., Xia, C., Yang, R., Sun, L., Yu, P. S., & He, L. (2020). A survey on text classification: From shallow to deep learning. arXiv preprint arXiv:2008.00364."},{"key":"4380_CR23","unstructured":"Lindsay, D. (1995). Scientific Writing. Longman Cheshire."},{"key":"4380_CR24","unstructured":"Mehta, P., Arora, G., & Majumder, P. (2018). Attention based sentence extraction from scientific articles using pseudo-labeled data. CoRR arXiv:1802.04675"},{"key":"4380_CR25","unstructured":"Mikolov, T., Chen, K., Corrado, G., & Dean, J. (2013). Efficient estimation of word representations in vector space. arXiv preprint arXiv:1301.3781."},{"issue":"4","key":"4380_CR26","doi-asserted-by":"publisher","first-page":"405","DOI":"10.1093\/reseval\/rvv016","volume":"24","author":"S Morton","year":"2015","unstructured":"Morton, S. (2015). Progressing research impact assessment: A \u2018contributions\u2019 approach. Research Evaluation, 24(4), 405\u2013419.","journal-title":"Research Evaluation"},{"key":"4380_CR27","unstructured":"nd (2022a) Annual meeting of the association for computational linguistics (acl). Retrieved February 18, 2022, from https:\/\/aclanthology.org\/venues\/acl\/"},{"key":"4380_CR28","unstructured":"nd (2022b) Information processing & management. Retrieved February 18, 2022, from https:\/\/www.journals.elsevier.com\/information-processing-and-management"},{"key":"4380_CR29","unstructured":"Oelen, A., Jaradeh, M. Y., Farfar, K. E., Stocker, M., & Auer, S. (2019). Comparing research contributions in a scholarly knowledge graph. In CEUR Workshop Proceedings 2526 (2019), (vol 2526, pp. 21\u201326). Aachen: RWTH Aachen."},{"key":"4380_CR30","doi-asserted-by":"crossref","unstructured":"Park, S., & Caragea, C. (2020). Scientific keyphrase identification and classification by pre-trained language models intermediate task transfer learning. In Proceedings of the 28th International Conference on Computational Linguistics, (pp. 5409\u20135419).","DOI":"10.18653\/v1\/2020.coling-main.472"},{"key":"4380_CR31","doi-asserted-by":"publisher","DOI":"10.1002\/9781118708019","volume-title":"Scientific writing: Easy when you know how","author":"J Peat","year":"2002","unstructured":"Peat, J., Elliott, E., Baur, L., & Keena, V. (2002). Scientific writing: Easy when you know how (1st ed.). London, United Kingdom: BMJ Books.","edition":"1"},{"key":"4380_CR32","unstructured":"QasemiZadeh, B., & Handschuh, S. (2014). The acl rd-tec: a dataset for benchmarking terminology extraction and classification in computational linguistics. In Proceedings of the 4th International Workshop on Computational Terminology (Computerm), (pp. 52\u201363)."},{"key":"4380_CR33","unstructured":"Rehman, T., Sanyal, D. K., Chattopadhyay, S., Bhowmick, P. K., & Das, P. P. (2021). Automatic generation of research highlights from scientific abstracts. In EEKE@JCDL\u201921 - Workshop on Extraction and Evaluation of Knowledge Entities from Scientific Documents."},{"key":"4380_CR34","doi-asserted-by":"crossref","unstructured":"Sateli, B., & Witte, R. (2015). What\u2019s in this paper? combining rhetorical entities with linked open data for semantic literature querying. In Proceedings of the 24th International Conference on World Wide Web, (pp. 1023\u20131028).","DOI":"10.1145\/2740908.2742022"},{"key":"4380_CR35","doi-asserted-by":"crossref","unstructured":"Shen, Y., & Liu, J. (2021). Comparison of text sentiment analysis based on bert and word2vec. In 2021 IEEE 3rd International Conference on Frontiers Technology of Information and Computer (ICFTIC), IEEE, (pp. 144\u2013147).","DOI":"10.1109\/ICFTIC54370.2021.9647258"},{"issue":"3","key":"4380_CR36","first-page":"364","volume":"92","author":"LB Sollaci","year":"2004","unstructured":"Sollaci, L. B., & Pereira, M. G. (2004). The introduction, methods, results, and discussion (imrad) structure: A fifty-year survey. Journal of the Medical Library Association, 92(3), 364.","journal-title":"Journal of the Medical Library Association"},{"key":"4380_CR37","unstructured":"Swales, J. (1990). Genre analysis: English in academic and research settings. Cambridge University Press."},{"key":"4380_CR38","doi-asserted-by":"crossref","unstructured":"Swales, J. M. (2011). Aspects of article introductions, michigan (classics). University of Michigan Press.","DOI":"10.3998\/mpub.3985899"},{"key":"4380_CR39","doi-asserted-by":"crossref","unstructured":"Teufel, S., Siddharthan, A., & Tidhar, D. (2006). An annotation scheme for citation function. In Proceedings of the 7th SIGdial Workshop on Discourse and Dialogue, (pp. 80\u201387).","DOI":"10.3115\/1654595.1654612"},{"key":"4380_CR40","first-page":"107","volume":"2020","author":"L Vogt","year":"2020","unstructured":"Vogt, L., D\u2019Souza, J., Stocker, M., & Auer, S. (2020). Toward representing research contributions in scholarly knowledge graphs using knowledge graph cells. Proceedings of the ACM\/IEEE Joint Conference on Digital Libraries in, 2020, 107\u2013116.","journal-title":"Proceedings of the ACM\/IEEE Joint Conference on Digital Libraries in"},{"key":"4380_CR41","doi-asserted-by":"crossref","unstructured":"Wang, W. M., See-To, E. W. K., Lin, H. T., & Li, Z. (2018). Comparison of automatic extraction of research highlights and abstracts of journal articles. In Proceedings of the 2nd International Conference on Computer Science and Application Engineering, (pp. 1\u20135).","DOI":"10.1145\/3207677.3277979"},{"key":"4380_CR42","unstructured":"Weng, W.H., Deaton, J., Natarajan, V., Elsayed, G. F., & Liu, Y. (2020). Addressing the real-world class imbalance problem in dermatology. In Machine Learning for Health, PMLR, (pp. 415\u2013429)."}],"container-title":["Scientometrics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11192-022-04380-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11192-022-04380-z\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11192-022-04380-z.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,12,5]],"date-time":"2022-12-05T05:17:57Z","timestamp":1670217477000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11192-022-04380-z"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,4,28]]},"references-count":42,"journal-issue":{"issue":"12","published-print":{"date-parts":[[2022,12]]}},"alternative-id":["4380"],"URL":"https:\/\/doi.org\/10.1007\/s11192-022-04380-z","relation":{},"ISSN":["0138-9130","1588-2861"],"issn-type":[{"value":"0138-9130","type":"print"},{"value":"1588-2861","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,4,28]]},"assertion":[{"value":"31 October 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 April 2022","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"28 April 2022","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}