{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,5]],"date-time":"2026-06-05T10:57:43Z","timestamp":1780657063222,"version":"3.54.1"},"reference-count":63,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2022,7,20]],"date-time":"2022-07-20T00:00:00Z","timestamp":1658275200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2022,7,20]],"date-time":"2022-07-20T00:00:00Z","timestamp":1658275200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"funder":[{"name":"Elsevier Center of Excellence for Natural Language Processing"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Digit Libr"],"published-print":{"date-parts":[[2022,9]]},"DOI":"10.1007\/s00799-022-00329-y","type":"journal-article","created":{"date-parts":[[2022,7,20]],"date-time":"2022-07-20T11:06:05Z","timestamp":1658315165000},"page":"289-301","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":63,"title":["ScienceQA: a novel resource for question answering on scholarly articles"],"prefix":"10.1007","volume":"23","author":[{"given":"Tanik","family":"Saikh","sequence":"first","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Tirthankar","family":"Ghosal","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Amish","family":"Mittal","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Asif","family":"Ekbal","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Pushpak","family":"Bhattacharyya","sequence":"additional","affiliation":[],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"297","published-online":{"date-parts":[[2022,7,20]]},"reference":[{"key":"329_CR1","doi-asserted-by":"publisher","unstructured":"Amini, A., Gabriel, S., Lin, S., Koncel-Kedziorski, R., Choi, Y., Hajishirzi, H.: MathQA: towards interpretable math word problem solving with operation-based formalisms. In: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers), pp. 2357\u20132367. Association for Computational Linguistics, Minneapolis, Minnesota (2019). https:\/\/doi.org\/10.18653\/v1\/N19-1245","DOI":"10.18653\/v1\/N19-1245"},{"key":"329_CR2","doi-asserted-by":"crossref","unstructured":"Beltagy, I., Cohan, A., Feigenblat, G., Freitag, D., Ghosal, T., Hall, K., Herrmannova, D., Knoth, P., Lo, K., Mayr, P., Patton, R., Shmueli-Scheuer, M., de\u00a0Waard, A., Wang, K., Wang, L.: Overview of the second workshop on scholarly document processing. In: Proceedings of the Second Workshop on Scholarly Document Processing, pp. 159\u2013165. Association for Computational Linguistics, Online (2021). https:\/\/aclanthology.org\/2021.sdp-1.22","DOI":"10.18653\/v1\/2020.sdp-1.1"},{"key":"329_CR3","doi-asserted-by":"publisher","unstructured":"Beltagy, I., Lo, K., Cohan, A.: SciBERT: A pretrained language model for scientific text. In: Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP), pp. 3615\u20133620. Association for Computational Linguistics, Hong Kong, China (2019). https:\/\/doi.org\/10.18653\/v1\/D19-1371","DOI":"10.18653\/v1\/D19-1371"},{"key":"329_CR4","doi-asserted-by":"crossref","unstructured":"Bjerva, J., Bhutani, N., Golahn, B., Tan, W.C., Augenstein, I.: SubjQA: a dataset for subjectivity and review comprehension. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing. Association for Computational Linguistics (2020)","DOI":"10.18653\/v1\/2020.emnlp-main.442"},{"key":"329_CR5","doi-asserted-by":"publisher","unstructured":"Bowman, S.R., Angeli, G., Potts, C., Manning, C.D.: A large annotated corpus for learning natural language inference. In: Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing, pp. 632\u2013642. Association for Computational Linguistics, Lisbon, Portugal (2015). https:\/\/doi.org\/10.18653\/v1\/D15-1075","DOI":"10.18653\/v1\/D15-1075"},{"key":"329_CR6","unstructured":"Chen, D.: Neural Reading Comprehension and Beyond. Ph.D. thesis, Stanford University (2018)"},{"key":"329_CR7","doi-asserted-by":"publisher","unstructured":"Chen, D., Bolton, J., Manning, C.D.: A Thorough examination of the cnn\/daily mail reading comprehension task. In: Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 2358\u20132367. Association for Computational Linguistics, Berlin, Germany (2016). https:\/\/doi.org\/10.18653\/v1\/P16-1223","DOI":"10.18653\/v1\/P16-1223"},{"key":"329_CR8","unstructured":"Chen, M., D\u2019Arcy, M., Liu, A., Fernandez, J., Downey, D.: CODAH: An adversarially-authored question answering dataset for common sense. In: Proceedings of the 3rd Workshop on Evaluating Vector Space Representations for NLP, pp. 63\u201369 (2019)"},{"key":"329_CR9","doi-asserted-by":"publisher","unstructured":"Chen, Q., Zhu, X., Ling, Z.H., Inkpen, D., Wei, S.: Neural natural language inference models enhanced with external knowledge. In: Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 2406\u20132417. Association for Computational Linguistics, Melbourne, Australia (2018). https:\/\/doi.org\/10.18653\/v1\/P18-1224","DOI":"10.18653\/v1\/P18-1224"},{"key":"329_CR10","doi-asserted-by":"publisher","unstructured":"Clark, C., Gardner, M.: Simple and effective multi-paragraph reading comprehension. In: Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 845\u2013855. Association for Computational Linguistics, Melbourne, Australia (2018). https:\/\/doi.org\/10.18653\/v1\/P18-1078","DOI":"10.18653\/v1\/P18-1078"},{"key":"329_CR11","unstructured":"Clark, P., Cowhey, I., Etzioni, O., Khot, T., Sabharwal, A., Schoenick, C., Tafjord, O.: Think you have solved question answering? Try ARC, the AI2 Reasoning Challenge. (2018) CoRR abs\/1803.05457http:\/\/arxiv.org\/abs\/1803.05457"},{"issue":"1","key":"329_CR12","first-page":"5","volume":"37","author":"P Clark","year":"2016","unstructured":"Clark, P., Etzioni, O.: My computer is an honor student\u2013but how intelligent is it? Standardized tests as a measure of AI. AI Mag. 37(1), 5\u201312 (2016)","journal-title":"AI Mag."},{"key":"329_CR13","unstructured":"Das, D., Katyal, Y., Verma, J., Dubey, S., Singh, A., Agarwal, K., Bhaduri, S., Ranjan, R.: Information retrieval and extraction on covid-19 clinical articles using graph community detection and bio-BERT embeddings. In: Proceedings of the 1st Workshop on NLP for COVID-19 at ACL 2020. Association for Computational Linguistics, Online (2020). https:\/\/aclanthology.org\/2020.nlpcovid19-acl.7"},{"key":"329_CR14","doi-asserted-by":"crossref","unstructured":"Denkowski, M., Lavie, A.: Meteor universal: language specific translation evaluation for any target language. In: Proceedings of the EACL 2014 Workshop on Statistical Machine Translation (2014)","DOI":"10.3115\/v1\/W14-3348"},{"key":"329_CR15","doi-asserted-by":"publisher","unstructured":"Devlin, J., Chang, M.W., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding. In: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers), pp. 4171\u20134186. Association for Computational Linguistics, Minneapolis, Minnesota (2019). https:\/\/doi.org\/10.18653\/v1\/N19-1423. https:\/\/www.aclweb.org\/anthology\/N19-1423","DOI":"10.18653\/v1\/N19-1423"},{"key":"329_CR16","doi-asserted-by":"publisher","unstructured":"Dhingra, B., Liu, H., Yang, Z., Cohen, W., Salakhutdinov, R.: Gated-attention readers for text comprehension. In: Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 1832\u20131846. Association for Computational Linguistics, Vancouver, Canada (2017). https:\/\/doi.org\/10.18653\/v1\/P17-1168","DOI":"10.18653\/v1\/P17-1168"},{"key":"329_CR17","unstructured":"Dunn, M., Sagun, L., Higgins, M., G\u00fcney, V.U., Cirik, V., Cho, K.: SearchQA: a new Q &A dataset augmented with context from a search engine. CoRR abs\/1704.05179http:\/\/arxiv.org\/abs\/1704.05179 (2017)"},{"issue":"5","key":"329_CR18","doi-asserted-by":"publisher","first-page":"378","DOI":"10.1037\/h0031619","volume":"76","author":"JL Fleiss","year":"1971","unstructured":"Fleiss, J.L.: Measuring nominal scale agreement among many raters. Psychol. Bull. 76(5), 378 (1971)","journal-title":"Psychol. Bull."},{"key":"329_CR19","doi-asserted-by":"crossref","unstructured":"He, W., Liu, K., Liu, J., Lyu, Y., Zhao, S., Xiao, X., Liu, Y., Wang, Y., Wu, H., She, Q., Liu, X., Wu, T., Wang, H.: DuReader: A chinese machine reading comprehension dataset from real-world applications. In: Proceedings of the Workshop on Machine Reading for Question Answering, pp. 37\u201346. Association for Computational Linguistics, Melbourne, Australia (2018)","DOI":"10.18653\/v1\/W18-2605"},{"key":"329_CR20","unstructured":"Hermann, K.M., Kocisky, T., Grefenstette, E., Espeholt, L., Kay, W., Suleyman, M., Blunsom, P.: Teaching machines to read and comprehend. In: Advances in neural information processing systems, pp. 1693\u20131701 (2015)"},{"key":"329_CR21","unstructured":"Hill, F., Bordes, A., Chopra, S., Weston, J.: The Goldilocks Principle: Reading Children\u2019s Books with Explicit Memory Representations. arXiv preprint arXiv:1511.02301 (2015)"},{"key":"329_CR22","doi-asserted-by":"publisher","unstructured":"Hirschman, L., Light, M., Breck, E., Burger, J.D.: Deep read: a reading comprehension system. In: Proceedings of the 37th Annual Meeting of the Association for Computational Linguistics, pp. 325\u2013332. Association for Computational Linguistics, College Park, Maryland, USA (1999). https:\/\/doi.org\/10.3115\/1034678.1034731","DOI":"10.3115\/1034678.1034731"},{"key":"329_CR23","doi-asserted-by":"publisher","unstructured":"Huang, L., Le\u00a0Bras, R., Bhagavatula, C., Choi, Y.: Cosmos QA: Machine reading comprehension with contextual commonsense reasoning. In: Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP), pp. 2391\u20132401. Association for Computational Linguistics, Hong Kong, China (2019). https:\/\/doi.org\/10.18653\/v1\/D19-1243","DOI":"10.18653\/v1\/D19-1243"},{"key":"329_CR24","doi-asserted-by":"publisher","unstructured":"Jiang, K., Wu, D., Jiang, H.: FreebaseQA: a new factoid QA data set matching trivia-style question-answer pairs with freebase. In: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers), pp. 318\u2013323. Association for Computational Linguistics, Minneapolis, Minnesota (2019). https:\/\/doi.org\/10.18653\/v1\/N19-1028","DOI":"10.18653\/v1\/N19-1028"},{"key":"329_CR25","doi-asserted-by":"crossref","unstructured":"Joshi, M., Choi, E., Weld, D.S., Zettlemoyer, L.: TriviaQA: A large scale distantly supervised challenge dataset for reading comprehension. In: Proceedings of the 55th Annual Meeting of the Association for Computational Linguistics. Association for Computational Linguistics, Vancouver, Canada (2017)","DOI":"10.18653\/v1\/P17-1147"},{"issue":"1","key":"329_CR26","doi-asserted-by":"publisher","DOI":"10.2196\/medinform.8751","volume":"6","author":"S Kim","year":"2018","unstructured":"Kim, S., Park, D., Choi, Y., Lee, K., Kim, B., Jeon, M., Kim, J., Tan, A.C., Kang, J.: A pilot study of biomedical text comprehension using an attention-based deep neural reader: design and experimental analysis. JMIR Med. Inf. 6(1), e2 (2018)","journal-title":"JMIR Med. Inf."},{"key":"329_CR27","doi-asserted-by":"publisher","first-page":"317","DOI":"10.1162\/tacl_a_00023","volume":"6","author":"T Ko\u010disk\u1ef3","year":"2018","unstructured":"Ko\u010disk\u1ef3, T., Schwarz, J., Blunsom, P., Dyer, C., Hermann, K.M., Melis, G., Grefenstette, E.: The NarrativeQA reading comprehension challenge. Trans. Assoc. Comput. Linguist. 6, 317\u2013328 (2018)","journal-title":"Trans. Assoc. Comput. Linguist."},{"key":"329_CR28","doi-asserted-by":"crossref","unstructured":"Kushman, N., Artzi, Y., Zettlemoyer, L., Barzilay, R.: Learning to automatically solve algebra word problems. In: Proceedings of the 52nd Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 271\u2013281 (2014)","DOI":"10.3115\/v1\/P14-1026"},{"key":"329_CR29","doi-asserted-by":"publisher","unstructured":"Lai, G., Xie, Q., Liu, H., Yang, Y., Hovy, E.: RACE: Large-scale ReAding comprehension dataset from examinations. In: Proceedings of the 2017 Conference on Empirical Methods in Natural Language Processing, pp. 785\u2013794. Association for Computational Linguistics, Copenhagen, Denmark (2017). https:\/\/doi.org\/10.18653\/v1\/D17-1082","DOI":"10.18653\/v1\/D17-1082"},{"key":"329_CR30","doi-asserted-by":"crossref","unstructured":"Landis, J.R., Koch, G.G.: The measurement of observer agreement for categorical data. Biometrics pp. 159\u2013174 (1977)","DOI":"10.2307\/2529310"},{"key":"329_CR31","unstructured":"Lin, C.Y.: ROUGE: A package for automatic evaluation of summaries. In: Text Summarization Branches Out, pp. 74\u201381. Association for Computational Linguistics, Barcelona, Spain (2004). https:\/\/aclanthology.org\/W04-1013"},{"key":"329_CR32","unstructured":"Nguyen, T., Rosenberg, M., Song, X., Gao, J., Tiwary, S., Majumder, R., Deng, L.: MS MARCO: A human generated machine reading comprehension dataset. In: Proceedings of the Workshop on Cognitive Computation: Integrating neural and symbolic approaches 2016 co-located with the 30th Annual Conference on Neural Information Processing Systems (NIPS 2016), Barcelona, Spain, December 9, 2016 (2016)"},{"key":"329_CR33","doi-asserted-by":"publisher","unstructured":"Papineni, K., Roukos, S., Ward, T., Zhu, W.J.: BLEU: a method for automatic evaluation of machine translation. In: Proceedings of the 40th Annual Meeting of the Association for Computational Linguistics, pp. 311\u2013318. Association for Computational Linguistics, Philadelphia, Pennsylvania, USA (2002). https:\/\/doi.org\/10.3115\/1073083.1073135","DOI":"10.3115\/1073083.1073135"},{"key":"329_CR34","unstructured":"Pappas, D., Androutsopoulos, I., Papageorgiou, H.: BioRead: a new dataset for biomedical reading comprehension. In: Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018). European Language Resources Association (ELRA), Miyazaki, Japan (2018). https:\/\/www.aclweb.org\/anthology\/L18-1439"},{"key":"329_CR35","doi-asserted-by":"publisher","first-page":"16246","DOI":"10.1109\/ACCESS.2019.2891666","volume":"7","author":"D Park","year":"2019","unstructured":"Park, D., Choi, Y., Kim, D., Yu, M., Kim, S., Kang, J.: Can machines learn to comprehend scientific literature? IEEE Access 7, 16246\u201316256 (2019)","journal-title":"IEEE Access"},{"key":"329_CR36","doi-asserted-by":"publisher","unstructured":"Rajpurkar, P., Jia, R., Liang, P.: Know what you don\u2019t know: unanswerable questions for squad. In: Proceedings of the 56th Annual Meeting of the Association for Computational Linguistics (Volume 2: Short Papers), pp. 784\u2013789. Association for Computational Linguistics, Melbourne, Australia (2018). https:\/\/doi.org\/10.18653\/v1\/P18-2124","DOI":"10.18653\/v1\/P18-2124"},{"key":"329_CR37","doi-asserted-by":"publisher","unstructured":"Rajpurkar, P., Zhang, J., Lopyrev, K., Liang, P.: SQuAD: 100,000+ questions for machine comprehension of text. In: Proceedings of the 2016 Conference on Empirical Methods in Natural Language Processing, pp. 2383\u20132392. Association for Computational Linguistics, Austin, Texas (2016). https:\/\/doi.org\/10.18653\/v1\/D16-1264","DOI":"10.18653\/v1\/D16-1264"},{"key":"329_CR38","doi-asserted-by":"publisher","first-page":"249","DOI":"10.1162\/tacl_a_00266","volume":"7","author":"S Reddy","year":"2019","unstructured":"Reddy, S., Chen, D., Manning, C.D.: CoQA: a conversational question answering challenge. Trans. Assoc. Comput. Linguist. 7, 249\u2013266 (2019)","journal-title":"Trans. Assoc. Comput. Linguist."},{"key":"329_CR39","doi-asserted-by":"crossref","unstructured":"Richardson, M., Burges, C.J., Renshaw, E.: MCTest: a challenge dataset for the open-domain machine comprehension of text. In: Proceedings of the 2013 Conference on Empirical Methods in Natural Language Processing, pp. 193\u2013203. Association for Computational Linguistics, Seattle, Washington, USA (2013). https:\/\/www.aclweb.org\/anthology\/D13-1020","DOI":"10.18653\/v1\/D13-1020"},{"key":"329_CR40","doi-asserted-by":"publisher","first-page":"842","DOI":"10.1162\/tacl_a_00349","volume":"8","author":"A Rogers","year":"2020","unstructured":"Rogers, A., Kovaleva, O., Rumshisky, A.: A primer in BERTology: what we know about how BERT works. Trans. Assoc. Comput. Linguist. 8, 842\u2013866 (2020)","journal-title":"Trans. Assoc. Comput. Linguist."},{"key":"329_CR41","unstructured":"Saikh, T., Ekbal, A., Bhattacharyya, P.: ScholarlyRead: a new dataset for scientific article reading comprehension. In: Proceedings of The 12th Language Resources and Evaluation Conference, pp. 5498\u20135504. European Language Resources Association, Marseille, France (2020). https:\/\/www.aclweb.org\/anthology\/2020.lrec-1.675"},{"key":"329_CR42","unstructured":"Sarkar, S.: Effectiveness of deep networks in NLP using BiDAF as an example architecture. arXiv preprint arXiv:2109.00074 (2021)"},{"key":"329_CR43","unstructured":"Seo, M., Kembhavi, A., Farhadi, A., Hajishirzi, H.: Bi-directional attention flow for machine comprehension. arXiv preprint arXiv:1611.01603 (2016)"},{"key":"329_CR44","doi-asserted-by":"publisher","first-page":"217","DOI":"10.1162\/tacl_a_00264","volume":"7","author":"K Sun","year":"2019","unstructured":"Sun, K., Yu, D., Chen, J., Yu, D., Choi, Y., Cardie, C.: DREAM: a challenge data set and models for dialogue-based reading comprehension. Trans. Assoc. Comput. Linguist. 7, 217\u2013231 (2019)","journal-title":"Trans. Assoc. Comput. Linguist."},{"key":"329_CR45","doi-asserted-by":"crossref","unstructured":"\u0160uster, S., Daelemans, W.: CliCR: a dataset of clinical case reports for machine reading comprehension. In: Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long Papers) (2018)","DOI":"10.18653\/v1\/N18-1140"},{"key":"329_CR46","doi-asserted-by":"publisher","unstructured":"Talmor, A., Herzig, J., Lourie, N., Berant, J.: CommonsenseQA: a question answering challenge targeting commonsense knowledge. In: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long and Short Papers), pp. 4149\u20134158. Association for Computational Linguistics, Minneapolis, Minnesota (2019). https:\/\/doi.org\/10.18653\/v1\/N19-1421","DOI":"10.18653\/v1\/N19-1421"},{"key":"329_CR47","doi-asserted-by":"publisher","unstructured":"Trischler, A., Wang, T., Yuan, X., Harris, J., Sordoni, A., Bachman, P., Suleman, K.: NewsQA: a machine comprehension dataset. In: Proceedings of the 2nd Workshop on Representation Learning for NLP, pp. 191\u2013200. Association for Computational Linguistics, Vancouver, Canada (2017). https:\/\/doi.org\/10.18653\/v1\/W17-2623","DOI":"10.18653\/v1\/W17-2623"},{"key":"329_CR48","doi-asserted-by":"publisher","first-page":"138","DOI":"10.1186\/s12859-015-0564-6","volume":"16","author":"G Tsatsaronis","year":"2015","unstructured":"Tsatsaronis, G., Balikas, G., Malakasiotis, P., Partalas, I., Zschunke, M., Alvers, M.R., Weissenborn, D., Krithara, A., Petridis, S., Polychronopoulos, D., Almirantis, Y., Pavlopoulos, J., Baskiotis, N., Gallinari, P., Artieres, T., Ngonga, A., Heino, N., Gaussier, E., Barrio-Alvers, L., Schroeder, M., Androutsopoulos, I., Paliouras, G.: An overview of the BIOASQ large-scale biomedical semantic indexing and question answering competition. BMC Bioinf. 16, 138 (2015). https:\/\/doi.org\/10.1186\/s12859-015-0564-6","journal-title":"BMC Bioinf."},{"key":"329_CR49","doi-asserted-by":"publisher","unstructured":"Vedantam, R., Zitnick, C.L., Parikh, D.: CIDEr: consensus-based image description evaluation. In: 2015 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 4566\u20134575 (2015). https:\/\/doi.org\/10.1109\/CVPR.2015.7299087","DOI":"10.1109\/CVPR.2015.7299087"},{"key":"329_CR50","unstructured":"Verspoor, K., Cohen, K.B., Dredze, M., Ferrara, E., May, J., Munro, R., Paris, C., Wallace, B. (eds.): Proceedings of the 1st Workshop on NLP for COVID-19 at ACL 2020. Association for Computational Linguistics, Online (2020). https:\/\/aclanthology.org\/2020.nlpcovid19-acl.0"},{"key":"329_CR51","doi-asserted-by":"publisher","unstructured":"Voorhees, E.M., Tice, D.M.: Building a question answering test collection. In: Proceedings of the 23rd Annual International ACM SIGIR Conference on Research and Development in Information Retrieval, SIGIR \u201900, pp. 200\u2013207. ACM, New York, NY, USA (2000). https:\/\/doi.org\/10.1145\/345508.345577. http:\/\/doi.acm.org\/10.1145\/345508.345577","DOI":"10.1145\/345508.345577"},{"key":"329_CR52","doi-asserted-by":"publisher","first-page":"287","DOI":"10.1162\/tacl_a_00021","volume":"6","author":"J Welbl","year":"2018","unstructured":"Welbl, J., Stenetorp, P., Riedel, S.: Constructing datasets for multi-hop reading comprehension across documents. Trans. Assoc. Comput. Linguist. 6, 287\u2013302 (2018)","journal-title":"Trans. Assoc. Comput. Linguist."},{"key":"329_CR53","unstructured":"Weston, J., Bordes, A., Chopra, S., Rush, A.M., van Merri\u00ebnboer, B., Joulin, A., Mikolov, T.: Towards AI-complete question answering: a set of prerequisite toy tasks. arXiv preprint arXiv:1502.05698 (2015)"},{"key":"329_CR54","doi-asserted-by":"crossref","unstructured":"Williams, A., Nangia, N., Bowman, S.: A broad-coverage challenge corpus for sentence understanding through inference. In: Proceedings of the 2018 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long Papers), pp. 1112\u20131122. Association for Computational Linguistics (2018)","DOI":"10.18653\/v1\/N18-1101"},{"key":"329_CR55","unstructured":"Wu, Y., Schuster, M., Chen, Z., Le, Q.V., Norouzi, M., Macherey, W., Krikun, M., Cao, Y., Gao, Q., Macherey, K., Klingner, J., Shah, A., Johnson, M., Liu, X., \u0141ukasz Kaiser, Gouws, S., Kato, Y., Kudo, T., Kazawa, H., Stevens, K., Kurian, G., Patil, N., Wang, W., Young, C., Smith, J., Riesa, J., Rudnick, A., Vinyals, O., Corrado, G., Hughes, M., Dean, J.: Google\u2019s Neural Machine Translation System: Bridging the Gap between Human and Machine Translation (2016)"},{"key":"329_CR56","unstructured":"Xiao, H.: Bert-as-service. https:\/\/github.com\/hanxiao\/bert-as-service (2018)"},{"key":"329_CR57","doi-asserted-by":"publisher","unstructured":"Xiong, W., Wu, J., Wang, H., Kulkarni, V., Yu, M., Chang, S., Guo, X., Wang, W.Y.: TWEETQA: a social media focused question answering dataset. In: Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics, pp. 5020\u20135031. Association for Computational Linguistics, Florence, Italy (2019). https:\/\/doi.org\/10.18653\/v1\/P19-1496","DOI":"10.18653\/v1\/P19-1496"},{"key":"329_CR58","doi-asserted-by":"publisher","unstructured":"Yagcioglu, S., Erdem, A., Erdem, E., Ikizler-Cinbis, N.: RecipeQA: a challenge dataset for multimodal comprehension of cooking recipes. In: Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, pp. 1358\u20131368. Association for Computational Linguistics, Brussels, Belgium (2018). https:\/\/doi.org\/10.18653\/v1\/D18-1166","DOI":"10.18653\/v1\/D18-1166"},{"key":"329_CR59","doi-asserted-by":"publisher","unstructured":"Yang, Y., Yih, W.t., Meek, C.: WikiQA: a challenge dataset for open-domain question answering. In: Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing, pp. 2013\u20132018. Association for Computational Linguistics, Lisbon, Portugal (2015). https:\/\/doi.org\/10.18653\/v1\/D15-1237","DOI":"10.18653\/v1\/D15-1237"},{"key":"329_CR60","doi-asserted-by":"publisher","unstructured":"Yang, Z., Qi, P., Zhang, S., Bengio, Y., Cohen, W., Salakhutdinov, R., Manning, C.D.: HotpotQA: a dataset for diverse, explainable multi-hop question answering. In: Proceedings of the 2018 Conference on Empirical Methods in Natural Language Processing, pp. 2369\u20132380. Association for Computational Linguistics, Brussels, Belgium (2018). https:\/\/doi.org\/10.18653\/v1\/D18-1259","DOI":"10.18653\/v1\/D18-1259"},{"key":"329_CR61","unstructured":"Yu, A.W., Dohan, D., Le, Q., Luong, T., Zhao, R., Chen, K.: Fast and accurate reading comprehension by combining self-attention and convolution. In: International Conference on Learning Representations (2018). https:\/\/openreview.net\/forum?id=B14TlG-RW"},{"key":"329_CR62","doi-asserted-by":"crossref","unstructured":"Yuan, X., Wang, T., G\u00fcl\u00e7ehre, \u00c7., Sordoni, A., Bachman, P., Zhang, S., Subramanian, S., Trischler, A.: Machine comprehension by text-to-text neural question generation. In: Proceedings of the 2nd Workshop on Representation Learning for NLP, Rep4NLP@ACL 2017, Vancouver, Canada, August 3, 2017, pp. 15\u201325 (2017)","DOI":"10.18653\/v1\/W17-2603"},{"key":"329_CR63","unstructured":"Zhu, M., Zhang, Y., Chen, W., Zhang, M., Zhu, J.: Fast and accurate shift-reduce constituent parsing. In: Proceedings of the 51st Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 434\u2013443. Association for Computational Linguistics, Sofia, Bulgaria (2013). https:\/\/www.aclweb.org\/anthology\/P13-1043"}],"container-title":["International Journal on Digital Libraries"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00799-022-00329-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s00799-022-00329-y\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s00799-022-00329-y.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,4,8]],"date-time":"2025-04-08T23:53:34Z","timestamp":1744156414000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s00799-022-00329-y"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,7,20]]},"references-count":63,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2022,9]]}},"alternative-id":["329"],"URL":"https:\/\/doi.org\/10.1007\/s00799-022-00329-y","relation":{},"ISSN":["1432-5012","1432-1300"],"issn-type":[{"value":"1432-5012","type":"print"},{"value":"1432-1300","type":"electronic"}],"subject":[],"published":{"date-parts":[[2022,7,20]]},"assertion":[{"value":"14 May 2021","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 June 2022","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 June 2022","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"20 July 2022","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}