{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,14]],"date-time":"2026-03-14T18:07:01Z","timestamp":1773511621474,"version":"3.50.1"},"publisher-location":"Cham","reference-count":37,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030865160","type":"print"},{"value":"9783030865177","type":"electronic"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-86517-7_20","type":"book-chapter","created":{"date-parts":[[2021,9,9]],"date-time":"2021-09-09T10:08:05Z","timestamp":1631182085000},"page":"319-334","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":5,"title":["Analyzing Research Trends in Inorganic Materials Literature Using NLP"],"prefix":"10.1007","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5914-009X","authenticated-orcid":false,"given":"Fusataka","family":"Kuniyoshi","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4212-9008","authenticated-orcid":false,"given":"Jun","family":"Ozawa","sequence":"additional","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2330-6972","authenticated-orcid":false,"given":"Makoto","family":"Miwa","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,9,10]]},"reference":[{"key":"20_CR1","unstructured":"Akbik, A., Bergmann, T., Blythe, D., Rasul, K., Schweter, S., Vollgraf, R.: FLAIR: an easy-to-use framework for state-of-the-art NLP. In: Annual Conference of the North American Chapter of the Association for Computational Linguistics (NAACL-HLT) (2019)"},{"key":"20_CR2","unstructured":"Kuniyoshi, F., Makino, K., Ozawa, J., Miwa, M.: Annotating and Extracting Synthesis Process of All-Solid-State Batteries from Scientific Literature. In: International Conference on Language Resources and Evaluation (LREC) (2020)"},{"key":"20_CR3","doi-asserted-by":"publisher","first-page":"95","DOI":"10.1038\/s41586-019-1335-8","volume":"571","author":"V Tshitoyan","year":"2019","unstructured":"Tshitoyan, V., et al.: Unsupervised word embeddings capture latent knowledge from materials science literature. Nature 571, 95\u201398 (2019)","journal-title":"Nature"},{"key":"20_CR4","unstructured":"Devlin, J., Chang, M., Lee, K., Toutanova, K.: BERT: pre-training of deep bidirectional transformers for language understanding. In: Annual Conference of the North American Chapter of the Association for Computational Linguistics (NAACL-HLT) (2019)"},{"key":"20_CR5","doi-asserted-by":"crossref","unstructured":"Beltagy, I., Lo, K., Cohan, A.: SciBERT: a pretrained language model for scientific text. In: International Joint Conference on Natural Language Processing(IJCNLP), 2019","DOI":"10.18653\/v1\/D19-1371"},{"key":"20_CR6","doi-asserted-by":"publisher","first-page":"260","DOI":"10.1038\/s41597-020-00602-2","volume":"7","author":"S Huang","year":"2020","unstructured":"Huang, S., Cole, J.: A database of battery materials auto-generated using ChemDataExtractor. Sci. Data 7, 260 (2020)","journal-title":"Sci. Data"},{"key":"20_CR7","unstructured":"Chaitanya, K., Wei, X., Alan, R., Raghu, M.: An annotated corpus for machine reading of instructions in wet lab protocols. In: Annual Conference of the North American Chapter of the Association for Computational Linguistics (NAACL-HLT) (2018)"},{"key":"20_CR8","unstructured":"Stenetorp, P., Pyysalo, S., Topic, G., Ohta, T., Ananiadou, S., Tsujii, J.: Brat: a Web-based Tool for NLP-Assisted Text Annotation. In: European Chapter of the Association for Computational Linguistics (EACL) (2012)"},{"key":"20_CR9","doi-asserted-by":"publisher","first-page":"3847","DOI":"10.1039\/C4TA04910A","volume":"3","author":"Q Yuan","year":"2015","unstructured":"Yuan, Q., Liu, P., Baker, G.: Sulfonated polyimide and PVDF based blend proton exchange membranes for fuel cell applications. J. Mater. Chem. 3, 3847\u20133853 (2015)","journal-title":"J. Mater. Chem."},{"issue":"3","key":"20_CR10","doi-asserted-by":"publisher","first-page":"1194","DOI":"10.1021\/acs.jcim.9b00995","volume":"60","author":"E Kim","year":"2020","unstructured":"Kim, E., et al.: Inorganic materials synthesis planning with literature-trained neural networks. J. Chem. Inf. Modeling 60(3), 1194\u20131201 (2020)","journal-title":"J. Chem. Inf. Modeling"},{"key":"20_CR11","unstructured":"Gu, Y., et al.: Domain-Specific Language Model Pretraining for Biomedical Natural Language Processing. In: ArXiv, abs\/2007.15779 (2020)"},{"key":"20_CR12","unstructured":"Wolf, T., et al.: Transformers: state-of-the-art natural language processing. In: Empirical Methods in Natural Language Processing (EMNLP) (2020)"},{"key":"20_CR13","doi-asserted-by":"publisher","first-page":"S2","DOI":"10.1186\/1758-2946-7-S1-S2","volume":"7","author":"M Krallinger","year":"2015","unstructured":"Krallinger, M., et al.: The CHEMDNER corpus of chemicals and drugs and its annotation principles. J. Cheminformatics 7, S2\u2013S2 (2015)","journal-title":"J. Cheminformatics"},{"key":"20_CR14","unstructured":"Takuya, A., Shotaro, S., Toshihiko, Y., Takeru, O., Masanori, K.: Optuna: a next-generation hyperparameter optimization framework. In: International Conference on Knowledge Discovery and Data Mining (SIGKDD) (2019)"},{"key":"20_CR15","doi-asserted-by":"crossref","unstructured":"Court, C.J., Cole, J.: Magnetic and superconducting phase diagrams and transition temperatures predicted using text mining and machine learning. npj Comput. Mater. 6, 1\u20139 (2020)","DOI":"10.1038\/s41524-020-0287-8"},{"key":"20_CR16","doi-asserted-by":"crossref","unstructured":"Kononova, O., et al.: Opportunities and challenges of text mining in aterials research. iScience 24, 3 (2021)","DOI":"10.1016\/j.isci.2021.102155"},{"key":"20_CR17","unstructured":"Akbik, A., Blythe, D., Vollgraf, R.: Contextual string embeddings for sequence labeling. In: International Conference on Computational Linguistics (COLING) (2018)"},{"key":"20_CR18","unstructured":"Huang, Z., Xu, W., Yu, K.: Bidirectional LSTM-CRF Models for Sequence Tagging. In: ArXiv, abs\/1508.01991 (2015)"},{"key":"20_CR19","doi-asserted-by":"crossref","unstructured":"Bada, M., et al.: Concept annotation in the CRAFT corpus. BMC Bioinform. 13, 161 (2011)","DOI":"10.1186\/1471-2105-13-161"},{"issue":"Suppl 1","key":"20_CR20","doi-asserted-by":"publisher","first-page":"i180","DOI":"10.1093\/bioinformatics\/btg1023","volume":"19","author":"JD Kim","year":"2003","unstructured":"Kim, J.D., Ohta, T., Tateisi, Y., Tsujii, J.: GENIA corpus - a semantically annotated corpus for bio-textmining. BMC Bioinformatics 19(Suppl 1), i180-2 (2003)","journal-title":"BMC Bioinformatics"},{"key":"20_CR21","doi-asserted-by":"publisher","first-page":"95","DOI":"10.1038\/s41586-019-1335-8","volume":"571","author":"V Tshitoyan","year":"2019","unstructured":"Tshitoyan, V., et al.: Unsupervised word embeddings capture latent knowledge from materials science literature. Nature 571, 95\u201398 (2019)","journal-title":"Nature"},{"key":"20_CR22","doi-asserted-by":"publisher","first-page":"892","DOI":"10.1021\/acscentsci.9b00193","volume":"5","author":"Z Jensen","year":"2019","unstructured":"Jensen, Z., et al.: A Machine Learning Approach to Zeolite Synthesis Enabled by Automatic Literature Data Extraction. ACS Central Science 5, 892\u2013899 (2019)","journal-title":"ACS Central Science"},{"key":"20_CR23","doi-asserted-by":"publisher","first-page":"9436","DOI":"10.1021\/acs.chemmater.7b03500","volume":"29","author":"E Kim","year":"2017","unstructured":"Kim, E., Huang, K., Saunders, A., McCallum, A., Ceder, G., Olivetti, E.: Materials Synthesis Insights from Scientific Literature via Text Extraction and Machine Learning. Chemistry of Materials 29, 9436\u20139444 (2017)","journal-title":"Chemistry of Materials"},{"key":"20_CR24","doi-asserted-by":"publisher","DOI":"10.1038\/sdata.2017.127","volume":"4","author":"E Kim","year":"2017","unstructured":"Kim, E., et al.: Machine-learned and codified synthesis parameters of oxide materials. Scientific Data 4, 170127 (2017)","journal-title":"Scientific Data"},{"key":"20_CR25","doi-asserted-by":"publisher","DOI":"10.1063\/1.5009942","volume":"123","author":"SR Young","year":"2018","unstructured":"Young, S.R., et al.: Data Mining for better material synthesis: the case of pulsed laser deposition of complex oxides. J. Appl. Phys. 123, 115303 (2018)","journal-title":"J. Appl. Phys."},{"key":"20_CR26","unstructured":"Yamaguchi, K., Asahi, R., Sasaki, Y.: SC-CoMIcs: a superconductivity corpus for materials informatics. In: International Conference on Language Resources and Evaluation (LREC) (2020)"},{"key":"20_CR27","doi-asserted-by":"publisher","first-page":"100999","DOI":"10.1016\/j.joi.2019.100999","volume":"14","author":"YK Jeong","year":"2020","unstructured":"Jeong, Y.K., Xie, Q., Yan, E., Song, M.: Examining drug and side effect relation using author-entity pair bipartite networks. J. Informetrics 14, 100999 (2020)","journal-title":"J. Informetrics"},{"key":"20_CR28","doi-asserted-by":"crossref","unstructured":"Hansson, L., et al.: Semantic text mining in early drug discovery for type 2 diabetes. PLoS ONE 15(6) (2020)","DOI":"10.1371\/journal.pone.0233956"},{"key":"20_CR29","doi-asserted-by":"publisher","first-page":"829","DOI":"10.1038\/nrg3337","volume":"13","author":"D Rebholz-Schuhmann","year":"2012","unstructured":"Rebholz-Schuhmann, D., Oellrich, A., Hoehndorf, R.: Text-mining solutions for biomedical research: enabling integrative biology. Nature Reviews Genetics 13, 829\u2013839 (2012)","journal-title":"Nature Reviews Genetics"},{"key":"20_CR30","doi-asserted-by":"publisher","first-page":"203","DOI":"10.1038\/s41597-019-0224-1","volume":"6","author":"O Kononova","year":"2019","unstructured":"Kononova, O., et al.: Text-mined dataset of inorganic materials synthesis recipes. Scientific Data 6, 203 (2019)","journal-title":"Scientific Data"},{"key":"20_CR31","doi-asserted-by":"publisher","first-page":"106860","DOI":"10.1016\/j.elecom.2020.106860","volume":"121","author":"R Mahbub","year":"2020","unstructured":"Mahbub, R., Huang, K., Jensen, Z., Hood, Z.D., Rupp, J., Olivetti, E.: Text mining for processing conditions of solid-state battery electrolyte. Electrochemistry Commun. 121, 106860 (2020)","journal-title":"Electrochemistry Commun."},{"key":"20_CR32","doi-asserted-by":"crossref","unstructured":"Weber, L., S\u00e4nger, M., Munchmeyer, J., Habibi, M., Leser, U.: HunFlair: an easy-to-use tool for state-of-the-art biomedical named entity recognition. BMC Bioinfomatics (2021)","DOI":"10.1093\/bioinformatics\/btab042"},{"key":"20_CR33","doi-asserted-by":"crossref","unstructured":"Huo, H., et al.: Semi-supervised machine-learning classification of materials synthesis procedures. npj Computational Materials 5, 1\u20137 (2019)","DOI":"10.1038\/s41524-019-0204-1"},{"key":"20_CR34","doi-asserted-by":"publisher","first-page":"1759","DOI":"10.1093\/bioinformatics\/bts237","volume":"28","author":"M Miwa","year":"2012","unstructured":"Miwa, M., Thompson, P., Ananiadou, S.: Boosting automatic event extraction from the literature using domain adaptation and coreference resolution. BMC Bioinf. 28, 1759\u20131765 (2012)","journal-title":"BMC Bioinf."},{"key":"20_CR35","doi-asserted-by":"crossref","unstructured":"Bj\u00f6rne, J., Salakoski, T.: Biomedical event extraction using convolutional neural networks and dependency parsing. In: Workshop on Biomedical Natural Language Processing (BioNLP) (2018)","DOI":"10.18653\/v1\/W18-2311"},{"key":"20_CR36","doi-asserted-by":"crossref","unstructured":"Mysore, S., et al.: The materials science procedural text corpus: annotating materials synthesis procedures with shallow semantic structures. In: Linguistic Annotation Workshop (LAW) (2019)","DOI":"10.18653\/v1\/W19-4007"},{"key":"20_CR37","unstructured":"Mikolov, T., Sutskever, I., Chen, K., Corrado, G.S., Dean, J.: Distributed representations of words and phrases and their compositionality. In: Neural Information Processing Systems (NeurIPS) (2013)"}],"container-title":["Lecture Notes in Computer Science","Machine Learning and Knowledge Discovery in Databases. Applied Data Science Track"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-86517-7_20","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,8]],"date-time":"2025-09-08T22:03:29Z","timestamp":1757369009000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-86517-7_20"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030865160","9783030865177"],"references-count":37,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-86517-7_20","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"10 September 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECML PKDD","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Joint European Conference on Machine Learning and Knowledge Discovery in Databases","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Bilbao","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Spain","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"13 September 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17 September 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"ecml2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/2021.ecmlpkdd.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"EasyChair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"869","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"210","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"24% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3-4","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3-9","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"The conference was held online due to the COVID-19 pandemic.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}