{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,1]],"date-time":"2025-08-01T03:54:03Z","timestamp":1754020443162,"version":"3.28.0"},"reference-count":35,"publisher":"IEEE","content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2016,10]]},"DOI":"10.1109\/escience.2016.7870884","type":"proceedings-article","created":{"date-parts":[[2017,3,6]],"date-time":"2017-03-06T22:09:29Z","timestamp":1488838169000},"page":"41-50","source":"Crossref","is-referenced-by-count":6,"title":["Cooperative human-machine data extraction from biological collections"],"prefix":"10.1109","author":[{"given":"Icaro","family":"Alzuru","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Andrea","family":"Matsunaga","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Mauricio","family":"Tsugawa","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Jose A. B.","family":"Fortes","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref33","article-title":"pyxDamerauLevenshtein","author":"fairchild","year":"2015","journal-title":"Github"},{"journal-title":"Advanced Computing and Information Systems (ACIS) laboratory","article-title":"HuMaIN: Human and Machine Intelligent Network","year":"0","key":"ref32"},{"key":"ref31","article-title":"A survey of text similarity approaches. International Journal of Computer Applications","volume":"68","author":"gomaa","year":"2013"},{"article-title":"LABELX Label Annotation Through Biodiversity Enhanced Learning","year":"2014","author":"heidorn","key":"ref30"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.2200\/S00516ED2V01Y201306CAC024"},{"year":"0","key":"ref34","article-title":"Symbiota Introduction"},{"journal-title":"iDigBio Wiki","article-title":"Augmenting OCR","year":"2014","key":"ref10"},{"key":"ref11","article-title":"SALIX, the Semi-automatic Label Information Extraction system","author":"lafferty","year":"2012","journal-title":"Tempe School of Life Sciences Arizona State University"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.12705\/623.16"},{"key":"ref13","article-title":"OCRoRACT: A Sequence Learning OCR System Trained on Isolated Characters","author":"ui-hasan","year":"2016","journal-title":"10th IAPR International Workshop on Document Analysis Systems"},{"article-title":"Extraction and Parsing of Herbarium Specimen Data: Exploring the Use of the Dublin Core Application Profile Framework","year":"2010","author":"moen","key":"ref14"},{"key":"ref15","article-title":"Tesseract Vs GOCR A Comparative Study)","volume":"2","author":"dhiman","year":"2013","journal-title":"International Journal of Recent Technology and Engineering (IJRTE)"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICDAR.2013.140"},{"key":"ref17","article-title":"ocropy","author":"breuel","year":"2010","journal-title":"Github"},{"key":"ref18","article-title":"Tesseract","author":"smith","year":"2007","journal-title":"Github"},{"key":"ref19","first-page":"629","article-title":"An Overview of the Tesseract OCR Engine","volume":"2","author":"smith","year":"2007","journal-title":"Proc of the International Conference on Document Analysis and Recognition"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1017\/CBO9781139924801"},{"key":"ref4","article-title":"Approaches to estimating the universe of natural history collections data","volume":"7","author":"arifio","year":"2010","journal-title":"Biodiversity Informatics"},{"year":"0","key":"ref27","article-title":"label-data"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"7","DOI":"10.3897\/zookeys.209.3313","article-title":"Mass digitization of scientificcollections: New opportunities to transform the use of biological specimens and underwrite biodiversity science","author":"beaman","year":"2012","journal-title":"ZooKeys"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.3897\/zookeys.209.3146"},{"article-title":"SALIX 2","year":"2013","author":"lafferty","key":"ref29"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.3897\/zookeys.209.3178"},{"year":"0","key":"ref8","article-title":"Notes From Nature"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.future.2015.07.004"},{"key":"ref2","article-title":"Scientific Collections: Mission-Critical Infrastructure for Federal Service Agencies","author":"bentley","year":"2009","journal-title":"Interagency Working Group on Scientific Collections(IW\/GSC)"},{"article-title":"Store First & Ask Questions Later","year":"2014","author":"wagner","key":"ref9"},{"journal-title":"UK NatSCA","article-title":"A Matter of Life and Death: Natural science collections: why keep them and why fund them?","year":"2005","key":"ref1"},{"key":"ref20","article-title":"Record Linkage Algorithms in F#_ Extensions to Jaro-Winkler Distance (Part 3) &#x00AB; Inviting Epiphany","author":"minerich","year":"2011","journal-title":"richardminerich com"},{"year":"0","key":"ref22","article-title":"Collaborative Data Extraction Scripts"},{"journal-title":"Wikipedia","article-title":"Optical character recognition","year":"2016","key":"ref21"},{"journal-title":"Wikipedia","article-title":"Jaro-Winkler distance","year":"2016","key":"ref24"},{"key":"ref23","article-title":"jellyfish 0.5.3","author":"turk","year":"2016","journal-title":"Python Org"},{"year":"2015","key":"ref26","article-title":"Darwin Core Terms: A quick reference guide"},{"year":"2015","key":"ref25","article-title":"Darwin Core"}],"event":{"name":"2016 IEEE 12th International Conference on e-Science (e-Science)","start":{"date-parts":[[2016,10,23]]},"location":"Baltimore, MD, USA","end":{"date-parts":[[2016,10,27]]}},"container-title":["2016 IEEE 12th International Conference on e-Science (e-Science)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/7864292\/7870873\/07870884.pdf?arnumber=7870884","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,10,3]],"date-time":"2020-10-03T12:09:16Z","timestamp":1601726956000},"score":1,"resource":{"primary":{"URL":"http:\/\/ieeexplore.ieee.org\/document\/7870884\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2016,10]]},"references-count":35,"URL":"https:\/\/doi.org\/10.1109\/escience.2016.7870884","relation":{},"subject":[],"published":{"date-parts":[[2016,10]]}}}