{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,3]],"date-time":"2025-09-03T10:54:28Z","timestamp":1756896868266,"version":"3.38.0"},"publisher-location":"Berlin, Heidelberg","reference-count":66,"publisher":"Springer Berlin Heidelberg","isbn-type":[{"type":"print","value":"9783540230601"},{"type":"electronic","value":"9783540286400"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2004]]},"DOI":"10.1007\/978-3-540-28640-0_1","type":"book-chapter","created":{"date-parts":[[2010,9,20]],"date-time":"2010-09-20T21:25:14Z","timestamp":1285017914000},"page":"1-16","source":"Crossref","is-referenced-by-count":12,"title":["Document Analysis Systems for Digital Libraries: Challenges and Opportunities"],"prefix":"10.1007","author":[{"given":"Henry S.","family":"Baird","sequence":"first","affiliation":[]},{"given":"Venugopal","family":"Govindaraju","sequence":"additional","affiliation":[]},{"given":"Daniel P.","family":"Lopresti","sequence":"additional","affiliation":[]}],"member":"297","reference":[{"key":"1_CR1","unstructured":"Abdelazim, H.Y., Hashish, M.A.: Application of HMM to the recognition of isolated Arabic words. In: Proceedings of 11th National Computer Conference, pp. 761\u2013774 (1989)"},{"key":"1_CR2","unstructured":"Association for Information and Image Management, International. 1100 Wayne Avenue, Suite 1100, Silver Spring, Maryland 20910; www.aiim.org"},{"key":"1_CR3","doi-asserted-by":"crossref","unstructured":"Allen, R.B., Schalow, J.: Metadata and data structures for the historical newspaper digital library. In: Proceedings of the 8th international conference on Information and knowledge management, pp. 147\u2013153 (1999)","DOI":"10.1145\/319950.319971"},{"issue":"5","key":"1_CR4","doi-asserted-by":"publisher","first-page":"517","DOI":"10.1016\/S0031-3203(97)00084-8","volume":"31","author":"A. Amin","year":"1997","unstructured":"Amin, A.: Offline Arabic character recognition: The state of the art. Pattern Recognition\u00a031(5), 517\u2013530 (1997)","journal-title":"Pattern Recognition"},{"key":"1_CR5","doi-asserted-by":"crossref","unstructured":"Antonacopoulos, A., Karatzas, D.: Document image analysis for World War II personal records. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries. (DIAL 2004), pp. 336\u2013341 (2004)","DOI":"10.1109\/DIAL.2004.1263263"},{"key":"1_CR6","doi-asserted-by":"crossref","unstructured":"Baird, H.: Difficult and urgent open problems in document image analysis for libraries. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries (DIAL 2004), pp. 25\u201332 (2004)","DOI":"10.1109\/DIAL.2004.1263234"},{"volume-title":"Proceedings of the International Workshop on Document Image Analysis for Libraries","year":"2004","key":"1_CR7","unstructured":"In: Baird, H.S., Govindaraju, V. (eds.): Proceedings of the International Workshop on Document Image Analysis for Libraries. IEEE Computer Society Press, Piscataway (2004)"},{"issue":"4","key":"1_CR8","doi-asserted-by":"publisher","first-page":"500","DOI":"10.1109\/3468.852443","volume":"30","author":"V. Bansal","year":"2000","unstructured":"Bansal, V.: Integrating knowledge sources in devanagari text recognition. IEEE Transactions on Systems, Man and Cybernetics Part A\u00a030(4), 500\u2013505 (2000)","journal-title":"IEEE Transactions on Systems, Man and Cybernetics Part A"},{"key":"1_CR9","doi-asserted-by":"crossref","unstructured":"Barrett, W.: Digital mountain: From granite archive to global access. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries (DIAL 2004), pp. 104\u2013121 (2004)","DOI":"10.1109\/DIAL.2004.1263243"},{"issue":"6","key":"1_CR10","doi-asserted-by":"publisher","first-page":"495","DOI":"10.1109\/34.771314","volume":"21","author":"I. Bazzi","year":"1999","unstructured":"Bazzi, I., Schwartz, R., Makhoul, J.: An omnifont open-vocabulary OCR system for English and Arabic. IEEE Pattern Analysis and Machine Intelligence\u00a021(6), 495\u2013504 (1999)","journal-title":"IEEE Pattern Analysis and Machine Intelligence"},{"key":"1_CR11","unstructured":"Bray, T., Paoli, J., Sperberg-McQueen, C.M., Maler, E.: Extensible Markup Language (XML) 1.0, 2nd edn (2001)"},{"key":"1_CR12","doi-asserted-by":"crossref","unstructured":"Breuel, T.M., Janssen, W.C., Popat, K., Baird, H.S.: Paper to PDA. In: Proc., IAPR 16th ICPR, Quebec City, Canada, August 2002, vol.\u00a04, pp. 476\u2013479 (2002)","DOI":"10.1109\/ICPR.2002.1044766"},{"key":"1_CR13","doi-asserted-by":"crossref","unstructured":"Chaudhuri, B.B., Pal, U.: An OCR system to read two Indian language scripts: Bangla and Devanagari. In: Proceedings of the 4th International Conference on Document Analysis and Recognition, pp. 1011\u20131015 (1997)","DOI":"10.1109\/ICDAR.1997.620662"},{"key":"1_CR14","doi-asserted-by":"crossref","unstructured":"Chaudhuri, B.B., Pal, U., Mitra, M.: Automatic recognition of printed Oriya script. In: Proceedings of the 6th International Conference on Document Analysis and Recognition, pp. 795\u2013799 (2001)","DOI":"10.1109\/ICDAR.2001.953897"},{"key":"1_CR15","doi-asserted-by":"crossref","unstructured":"Chen, F.R., Bloomberg, D.: Summarization of imaged documents without OCR. Computer Vision and Image Understanding\u00a070(3) (June 1998)","DOI":"10.1006\/cviu.1998.0688"},{"key":"1_CR16","doi-asserted-by":"crossref","unstructured":"Chew, M., Baird, H.S.: BaffleText: a Human Interactive Proof. In: Proc., 10th IS&T\/SPIE Document Recognition & Retrieval Conf., Santa Clara, CA, January 23\u201324 (2003)","DOI":"10.1117\/12.479682"},{"key":"1_CR17","unstructured":"Unicode Consortium. The Unicode Standard Version 4.0. Addison-Wesley (2003)"},{"key":"1_CR18","doi-asserted-by":"crossref","unstructured":"Couasnon, B., Camillerapp, J., Leplumey, I.: Making handwritten archives documents accessible to public with a generic system of document image analysis. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries (DIAL 2004), pp. 270\u2013277 (2004)","DOI":"10.1109\/DIAL.2004.1263255"},{"issue":"10","key":"1_CR19","doi-asserted-by":"publisher","first-page":"1297","DOI":"10.1080\/00140139208967394","volume":"35","author":"A. Dillon","year":"1992","unstructured":"Dillon, A.: Reading from paper versus screens: A critical review of the empirical literature. Ergonomics\u00a035(10), 1297\u20131326 (1992)","journal-title":"Ergonomics"},{"key":"1_CR20","doi-asserted-by":"crossref","unstructured":"Doermann, D.: The indexing and retrieval of document images: A survey. Computer Vision and Image Understanding\u00a070(3) (June 1998)","DOI":"10.1006\/cviu.1998.0692"},{"key":"1_CR21","unstructured":"E Ink, 733 Concord Avenue, Cambridge, MA 02138, www.eink.com"},{"key":"1_CR22","doi-asserted-by":"crossref","unstructured":"Govindaraju, V., Khedekar, S., Kompalli, S., Farooq, F., Setlur, S., Prasad, V.: Tools for enabling digital access to multilingual Indic documents. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries (DIAL 2004), pp. 122\u2013133 (2004)","DOI":"10.1109\/DIAL.2004.1263244"},{"key":"1_CR23","doi-asserted-by":"crossref","unstructured":"Govindaraju, V., Xue, H.: Fast handwriting recognition for indexing historical documents. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries. (DIAL 2004), pp. 314\u2013320 (2004)","DOI":"10.1109\/DIAL.2004.1263260"},{"key":"1_CR24","unstructured":"Green, D.: The Java Tutorial: Internationalization, java.sun.com\/docs\/books\/tutorial\/i18n\/"},{"key":"1_CR25","unstructured":"Gyricon Media, Inc., 6190 Jackson Road, Ann Arbor, MI 48103, www.gyriconmedia.com"},{"key":"1_CR26","doi-asserted-by":"crossref","unstructured":"Harit, G., Chadhury, S., Ghosh, H.: Managing document images in a digital library: An ontology guided approach. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries. (DIAL 2004), pp. 64\u201392 (2004)","DOI":"10.1109\/DIAL.2004.1263238"},{"key":"1_CR27","doi-asserted-by":"crossref","unstructured":"Hochberg, J., Kerns, L., Kelly, P., Thomas, T.: Automatic script identification from images using cluster-based templates. In: Proceedings of the 3rd International Conference on Document Analysis and Recognition, vol.\u00a01, pp. 378\u2013381 (1995)","DOI":"10.1109\/ICDAR.1995.599017"},{"key":"1_CR28","doi-asserted-by":"crossref","unstructured":"Hutchison, L., Barrett, W.A.: Fast registration of tabular document images using Fourier analysis. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries (DIAL 2004), pp. 253\u2013267 (2004)","DOI":"10.1109\/DIAL.2004.1263254"},{"key":"1_CR29","unstructured":"JSTOR Digital Library. University of Michigan and Princeton University, www.jstor.org"},{"key":"1_CR30","doi-asserted-by":"crossref","unstructured":"Kim, D.H., Hwang, Y.S., Park, S.T., Kim, E., Paek, S., Bang, S.: Handwritten Korean character image database. In: Proceedings of the 2nd International Conference on Document Analysis and Recognition, pp. 470\u2013473 (1993)","DOI":"10.1109\/ICDAR.1993.395693"},{"key":"1_CR31","unstructured":"Kim, M., Jang, M., Choi, H., Rhee, T., Kim, J.H.: Digitalizing scheme of handwritten Hanja historical document. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries. (DIAL 2004), pp. 321\u2013327 (2004)"},{"key":"1_CR32","doi-asserted-by":"crossref","unstructured":"Kompalli, S., Setlur, S., Govindaraju, V., Vemulapati, R.: Creation of data resources and design of an evaluation test bed for Devanagari script recognition. In: Proceedings of the 13th International Workshop on Research Issues on Data Engineering: Multi-lingual Information Management, pp. 55\u201361 (2003)","DOI":"10.1109\/RIDE.2003.1249846"},{"key":"1_CR33","doi-asserted-by":"crossref","unstructured":"Kornfield, M., Manmatha, R., Allan, J.: Text alignment with handwritten documents. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries. (DIAL 2004), pp. 195\u2013209 (2004)","DOI":"10.1109\/DIAL.2004.1263249"},{"key":"1_CR34","doi-asserted-by":"crossref","unstructured":"Lavrenko, V., Rath, T., Manmatha, R.: Holistic word recognition for handwritten historical documents. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries. (DIAL 2004), pp. 278\u2013287 (2004)","DOI":"10.1109\/DIAL.2004.1263256"},{"key":"1_CR35","doi-asserted-by":"crossref","unstructured":"LeBourgeois, F., Trinh, E., Allier, B., Eglin, V., Emptoz, H.: Document images analysis solutions for digital libraries. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries. (DIAL 2004), pp. 2\u201324 (2004)","DOI":"10.1109\/DIAL.2004.1263233"},{"issue":"3","key":"1_CR36","first-page":"811","volume":"36","author":"C.H. Lee","year":"2003","unstructured":"Lee, C.H., Kanungo, T.: The architecture of TrueViz: A groundTRUth \/ metadata editing and VIsualiZing toolkit. PR\u00a036(3), 811\u2013825 (2003)","journal-title":"PR"},{"key":"1_CR37","doi-asserted-by":"crossref","unstructured":"Loce, R.P., Dougherty, E.R.: Enhancement and Restoration of Digital Documents: Statistical Design of Nonlinear Algorithms. Society of Photo-optical Instrumentation Engineers (January 1997) ISBN 081942109X","DOI":"10.1117\/PM29"},{"issue":"2","key":"1_CR38","first-page":"198","volume":"26","author":"H. Ma","year":"2003","unstructured":"Ma, H., Doermann, D.: Adaptive Hindi OCR using generalized Hausdorff image comparison. ACM Transactions on Asian Language Information Processing\u00a026(2), 198\u2013213 (2003)","journal-title":"ACM Transactions on Asian Language Information Processing"},{"key":"1_CR39","doi-asserted-by":"crossref","unstructured":"Marinai, S., Marino, E., Cesarani, F., Soda, G.: A general system for the retrieval of document images from digital libraries. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries. (DIAL 2004), pp. 150\u2013 173 (2004)","DOI":"10.1109\/DIAL.2004.1263246"},{"key":"1_CR40","unstructured":"Microsoft Windows glyph processing, www.microsoft.com\/typography\/developers\/opentype\/default.htm"},{"issue":"1","key":"1_CR41","doi-asserted-by":"publisher","first-page":"38","DOI":"10.1109\/34.824820","volume":"22","author":"G. Nagy","year":"2000","unstructured":"Nagy, G.: Twenty years of document image analysis in PAMI. IEEE Transactions on Pattern Analysis and Machine Intelligence\u00a022(1), 38\u201362 (2000)","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1_CR42","doi-asserted-by":"crossref","unstructured":"Namboodiri, M., Jain, A.K.: On-line script recognition. In: Proceedings of the 16th International Conference on Pattern Recognition, pp. 736\u2013739 (2002)","DOI":"10.1109\/ICPR.2002.1048081"},{"key":"1_CR43","unstructured":"Bureau of Indian Standards. Indian script code for information interchange (1999)"},{"key":"1_CR44","doi-asserted-by":"crossref","unstructured":"Pal, U., Chaudhuri, B.B.: Script line separation from Indian multi-script documents. In: Proceedings of the 5th International Conference on Document Analysis and Recognition, pp. 406\u2013409 (1999)","DOI":"10.1109\/ICDAR.1999.791810"},{"key":"1_CR45","unstructured":"NPES\/AIIM PDF \u2013 Archive Project, www.aiim.org\/standards.asp?ID=25013"},{"key":"1_CR46","unstructured":"ProjectGutenberg, promo.net\/pg"},{"key":"1_CR47","unstructured":"Rajkumar, S.: Indic typesetting \u2013 challenges and opportunities. TUGboat, 23(1) (2002)"},{"key":"1_CR48","unstructured":"Rice, S.V., Jenkins, F.R., Nartker, T.A.: The fifth annual test of OCR accuracy. Technical report, Information Science Research Institute, Univ. of Nevada at Las Vegas, Las Vegas, Nevada (1996) ISRI TR-96-01"},{"key":"1_CR49","unstructured":"Sarkar, P., Baird, H.S., Henderson, J.: Triage of OCR output using \u2019confidence\u2019 scores. In: Proc. 9th IS&T\/SPIE Document Recognition & Retrieval Conf., San Jose, CA (January 2002)"},{"key":"1_CR50","volume-title":"The Myth of the Paperless Office","author":"J. Sellen","year":"2002","unstructured":"Sellen, J., Harper, R.H.R.: The Myth of the Paperless Office. The MIT Press, Cambridge (2002)"},{"issue":"3","key":"1_CR51","doi-asserted-by":"publisher","first-page":"154","DOI":"10.1007\/s100320200069","volume":"4","author":"S. Setlur","year":"2002","unstructured":"Setlur, S., Lawson, A., Govindaraju, V., Srihari, S.: Large scale address recognition systems \u2013 truthing, testing, tools and other evaluation issues. International Journal of Document Analysis and Recognition\u00a04(3), 154\u2013169 (2002)","journal-title":"International Journal of Document Analysis and Recognition"},{"key":"1_CR52","doi-asserted-by":"crossref","unstructured":"Shanbhag, S., Rao, D., Joshi, R.K.: An intelligent multi-layered input scheme for phonetic scripts. In: Proceedings of the 2nd International Symposium on Smart Graphics, pp. 35\u201338 (2002)","DOI":"10.1145\/569005.569011"},{"key":"1_CR53","doi-asserted-by":"crossref","unstructured":"Simske, S.J., Sturgill, M.: A ground-truthing engine for proofsetting, publishing, re-purposing and quality assurance. In: Proceedings of the 2003 ACM Symposium on Document Engineering, pp. 150\u2013152 (2003)","DOI":"10.1145\/958220.958247"},{"issue":"6","key":"1_CR54","doi-asserted-by":"publisher","first-page":"623","DOI":"10.1109\/34.601250","volume":"19","author":"B.K. Sin","year":"1997","unstructured":"Sin, B.K., Kim, J.H.: Ligature modeling for online cursive script recognition. IEEE Transactions on Pattern Analysis and Machine Intelligence\u00a019(6), 623\u2013633 (1997)","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1_CR55","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1007\/3-540-45869-7_1","volume-title":"Document Analysis Systems V","author":"E.H. Barney Smith","year":"2002","unstructured":"Barney Smith, E.H., Qiu, X.: Relating statistical image differences and degradation features. In: Lopresti, D.P., Hu, J., Kashi, R.S. (eds.) DAS 2002. LNCS, vol.\u00a02423, pp. 1\u201312. Springer, Heidelberg (2002)"},{"key":"1_CR56","doi-asserted-by":"publisher","first-page":"242","DOI":"10.1142\/9789812797704_0013","volume-title":"Document Analysis Systems II","author":"L. Spitz","year":"1998","unstructured":"Spitz, L.: SPAM: A scientific paper access method. In: Document Analysis Systems II, pp. 242\u2013255. World Scientific, Singapore (1998)"},{"key":"1_CR57","unstructured":"Srihari, S.N., Kuebert, E.J.: Integration of handwritten address interpretation technology into the United States Postal Service remote computer reader system. In: Proceedings of the 4th International Conference on Document Analysis and Recognition (1997)"},{"key":"1_CR58","unstructured":"Stork, D.G.: The Open Mind initiative. In: Proc., IEEE Expert Systems and Their Applications, pp. 16\u201320 (May\/June 1999), www.openmind.org"},{"key":"1_CR59","doi-asserted-by":"crossref","first-page":"73","DOI":"10.1117\/12.476023","volume-title":"Proc., SPIE\/IS&T Electronic Imaging Conf. on Document Recognition & Retrieval X","author":"K. Summers","year":"2003","unstructured":"Summers, K.: Document image improvement for OCR as a classification problem. In: Proc., SPIE\/IS&T Electronic Imaging Conf. on Document Recognition & Retrieval X, Santa Clara, CA, January 2003, vol.\u00a05010, pp. 73\u201383. SPIE, San Jose (2003)"},{"key":"1_CR60","unstructured":"Sun Solaris 9 operating system features and benefits \u2013 compatibility, www.sun.com\/software\/solaris\/sparc\/solaris9featurescompatibility.html"},{"key":"1_CR61","doi-asserted-by":"crossref","unstructured":"Tai, J.-W., Liu, Y.-J., Zhang, L.-Q.: A model based detecting approach for feature extraction of off-line handwritten Chinese character recognition. In: Proceedings of the 2nd International Conference on Document Analysis and Recognition (1993)","DOI":"10.1109\/ICDAR.1993.395610"},{"issue":"7","key":"1_CR62","doi-asserted-by":"publisher","first-page":"751","DOI":"10.1109\/34.689305","volume":"20","author":"T.N. Tan","year":"1998","unstructured":"Tan, T.N.: Rotation invariant texture features and their use in automatic script identification. IEEE Transactions on Pattern Analysis and Machine Intelligence\u00a020(7), 751\u2013756 (1998)","journal-title":"IEEE Transactions on Pattern Analysis and Machine Intelligence"},{"key":"1_CR63","unstructured":"The XML version of the TEI guidelines, www.tei-c.org\/P4X\/CH.html"},{"key":"1_CR64","doi-asserted-by":"crossref","unstructured":"Wang, A.-B., Huang, J.S., Fan, K.-C.: Optical recognition of handwritten chinese characters by partial matching. In: Proceedings of the 2nd International Conference on Document Analysis and Recognition (1993)","DOI":"10.1109\/ICDAR.1993.395611"},{"key":"1_CR65","doi-asserted-by":"crossref","unstructured":"Yosef, B., Kedem, K., Dinstein, I., Beit-Arie, M., Engel, E.: Classification of Hebrew calligraphic handwriting styles: Preliminary results. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries (DIAL 2004), pp. 299\u2013305 (2004)","DOI":"10.1109\/DIAL.2004.1263258"},{"key":"1_CR66","doi-asserted-by":"crossref","unstructured":"Zhang, B., Tomai, C., Srihari, S., Govindaraju, V.: Construction of handwriting databases using transcript-based mapping. In: Proceedings of the 1st International Workshop on Document Image Analysis for Libraries (DIAL 2004), pp. 288\u2013298 (2004)","DOI":"10.1109\/DIAL.2004.1263257"}],"container-title":["Lecture Notes in Computer Science","Document Analysis Systems VI"],"original-title":[],"link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-540-28640-0_1.pdf","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,2,25]],"date-time":"2025-02-25T23:15:27Z","timestamp":1740525327000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/978-3-540-28640-0_1"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2004]]},"ISBN":["9783540230601","9783540286400"],"references-count":66,"URL":"https:\/\/doi.org\/10.1007\/978-3-540-28640-0_1","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2004]]}}}