{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T18:33:21Z","timestamp":1743014001402,"version":"3.40.3"},"publisher-location":"Cham","reference-count":27,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031463105"},{"type":"electronic","value":"9783031463112"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-46311-2_11","type":"book-chapter","created":{"date-parts":[[2023,10,28]],"date-time":"2023-10-28T19:01:50Z","timestamp":1698519710000},"page":"128-137","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":1,"title":["End-to-End Multilingual Text Recognition Based on\u00a0Byte Modeling"],"prefix":"10.1007","author":[{"given":"Jiajia","family":"Wu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Kun","family":"Zhao","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Zhengyan","family":"Yang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Bing","family":"Yin","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Cong","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lirong","family":"Dai","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2023,10,29]]},"reference":[{"key":"11_CR1","series-title":"Communications in Computer and Information Science","doi-asserted-by":"publisher","first-page":"187","DOI":"10.1007\/978-3-642-35292-8_20","volume-title":"Advances in Speech and Language Technologies for Iberian Languages","author":"MA del Agua","year":"2012","unstructured":"del Agua, M.A., Serrano, N., Civera, J., Juan, A.: Character-based handwritten text recognition of multilingual documents. In: Torre Toledano, D., et al. (eds.) IberSPEECH 2012. CCIS, vol. 328, pp. 187\u2013196. Springer, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-35292-8_20"},{"key":"11_CR2","unstructured":"Bahdanau, D., Cho, K., Bengio, Y.: Neural machine translation by jointly learning to align and translate. In: International Conference on Learning Representations (2015)"},{"issue":"3","key":"11_CR3","first-page":"21","volume":"5","author":"J Bettels","year":"1993","unstructured":"Bettels, J., Bishop, F.A.: Unicode: a universal character code. Digit. Tech. J. 5(3), 21\u201331 (1993)","journal-title":"Digit. Tech. J."},{"issue":"4","key":"11_CR4","first-page":"467","volume":"18","author":"PF Brown","year":"1992","unstructured":"Brown, P.F., Della Pietra, V.J., Desouza, P.V., Lai, J.C., Mercer, R.L.: Class-based n-gram models of natural language. Comput. Linguist. 18(4), 467\u2013480 (1992)","journal-title":"Comput. Linguist."},{"key":"11_CR5","doi-asserted-by":"publisher","unstructured":"Gillick, D., Brunk, C., Vinyals, O., Subramanya, A.: Multilingual language processing from bytes. In: Proceedings of the 2016 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 1296\u20131306. Association for Computational Linguistics, San Diego, California (2016). https:\/\/doi.org\/10.18653\/v1\/N16-1155","DOI":"10.18653\/v1\/N16-1155"},{"key":"11_CR6","doi-asserted-by":"publisher","unstructured":"Graves, A.: Supervised sequence labelling. in: supervised sequence labelling with recurrent neural networks. Studies in Computational Intelligence, vol. 385. Springer, Berlin, Heidelberg (2012). https:\/\/doi.org\/10.1007\/978-3-642-24797-2_2","DOI":"10.1007\/978-3-642-24797-2_2"},{"key":"11_CR7","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2016)","DOI":"10.1109\/CVPR.2016.90"},{"issue":"8","key":"11_CR8","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J.: Long short-term memory. Neural Comput. 9(8), 1735\u20131780 (1997)","journal-title":"Neural Comput."},{"key":"11_CR9","doi-asserted-by":"crossref","unstructured":"Huang, J., et al.: A multiplexed network for end-to-end, multilingual OCR. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 4547\u20134557 (2021)","DOI":"10.1109\/CVPR46437.2021.00452"},{"key":"11_CR10","doi-asserted-by":"crossref","unstructured":"Jean, S., Cho, K., Memisevic, R., Bengio, Y.: On using very large target vocabulary for neural machine translation (2014)","DOI":"10.3115\/v1\/P15-1001"},{"key":"11_CR11","unstructured":"Kingma, D., Ba, J.: Adam: A method for stochastic optimization. Computer Science (2014)"},{"key":"11_CR12","doi-asserted-by":"crossref","unstructured":"Li, B., Zhang, Y., Sainath, T., Wu, Y., Chan, W.: Bytes are all you need: End-to-end multilingual speech recognition and synthesis with bytes. In: ICASSP 2019\u20132019 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 5621\u20135625. IEEE (2019)","DOI":"10.1109\/ICASSP.2019.8682674"},{"key":"11_CR13","doi-asserted-by":"crossref","unstructured":"Ma, L.L., Liu, C.L.: On-line handwritten Chinese character recognition based on nested segmentation of radicals. In: 2009 Chinese Conference on Pattern Recognition, pp. 1\u20135. IEEE (2009)","DOI":"10.1109\/CCPR.2009.5343976"},{"key":"11_CR14","doi-asserted-by":"crossref","unstructured":"Mikolov, T., Karafi\u00e1t, M., Burget, L., Cernock\u1ef3, J., Khudanpur, S.: Recurrent neural network based language model. In: Interspeech. vol. 2, pp. 1045\u20131048. Makuhari (2010)","DOI":"10.21437\/Interspeech.2010-343"},{"key":"11_CR15","unstructured":"Mikolov, T., Sutskever, I., Deoras, A., Le, H.S., Kombrink, S., Cernock\u00fd, J.H.: Subword language modeling with neural networks (2011)"},{"key":"11_CR16","doi-asserted-by":"publisher","unstructured":"Sennrich, R., Haddow, B., Birch, A.: Neural machine translation of rare words with subword units. In: Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 1715\u20131725. Association for Computational Linguistics, Berlin, Germany (2016). https:\/\/doi.org\/10.18653\/v1\/P16-1162","DOI":"10.18653\/v1\/P16-1162"},{"issue":"11","key":"11_CR17","doi-asserted-by":"publisher","first-page":"2298","DOI":"10.1109\/TPAMI.2016.2646371","volume":"39","author":"B Shi","year":"2016","unstructured":"Shi, B., Bai, X., Yao, C.: An end-to-end trainable neural network for image-based sequence recognition and its application to scene text recognition. IEEE Trans. Pattern Anal. Mach. Intell. 39(11), 2298\u20132304 (2016)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"issue":"9","key":"11_CR18","doi-asserted-by":"publisher","first-page":"2035","DOI":"10.1109\/TPAMI.2018.2848939","volume":"41","author":"B Shi","year":"2018","unstructured":"Shi, B., Yang, M., Wang, X., Lyu, P., Yao, C., Bai, X.: Aster: an attentional scene text recognizer with flexible rectification. IEEE Trans. Pattern Anal. Mach. Intell. 41(9), 2035\u20132048 (2018)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"11_CR19","unstructured":"Smith, L.N., Topin, N.: Super-convergence: Very fast training of neural networks using large learning rates (2017)"},{"key":"11_CR20","doi-asserted-by":"crossref","unstructured":"Snyder, B., Barzilay, R.: Unsupervised multilingual learning for morphological segmentation. In: Proceedings of ACL-08: HLT, pp. 737\u2013745. Association for Computational Linguistics, Columbus, Ohio (2008)","DOI":"10.3115\/1613715.1613851"},{"key":"11_CR21","doi-asserted-by":"publisher","first-page":"125","DOI":"10.1016\/j.patcog.2015.07.009","volume":"51","author":"S Tian","year":"2016","unstructured":"Tian, S., et al.: Multilingual scene character recognition with co-occurrence of histogram of oriented gradients. Pattern Recogn. 51, 125\u2013134 (2016)","journal-title":"Pattern Recogn."},{"key":"11_CR22","unstructured":"Tiedemann, J.: Character-based PSMT for closely related languages. In: Proceedings of the 13th Annual Conference of the European Association for Machine Translation. European Association for Machine Translation, Barcelona, Spain (2009)"},{"key":"11_CR23","doi-asserted-by":"crossref","unstructured":"Tu, Z., Lu, Z., Yang, L., Liu, X., Hang, L.: Modeling coverage for neural machine translation. In: Proceedings of the 54th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers) (2016)","DOI":"10.18653\/v1\/P16-1008"},{"key":"11_CR24","doi-asserted-by":"crossref","unstructured":"Vilar, D., Peter, J.T., Ney, H.: Can we translate letters? In: Proceedings of the Second Workshop on Statistical Machine Translation, pp. 33\u201339. Association for Computational Linguistics, Prague, Czech Republic (2007)","DOI":"10.3115\/1626355.1626360"},{"key":"11_CR25","doi-asserted-by":"crossref","unstructured":"Wang, C., Cho, K., Gu, J.: Neural machine translation with byte-level subwords. In: Proceedings of the AAAI Conference on Artificial Intelligence. vol. 34, pp. 9154\u20139160 (2020)","DOI":"10.1609\/aaai.v34i05.6451"},{"issue":"8","key":"11_CR26","doi-asserted-by":"publisher","first-page":"1469","DOI":"10.1109\/TPAMI.2011.264","volume":"34","author":"QF Wang","year":"2011","unstructured":"Wang, Q.F., Yin, F., Liu, C.L.: Handwritten Chinese text recognition by integrating multiple contexts. IEEE Trans. Pattern Anal. Mach. Intell. 34(8), 1469\u20131481 (2011)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"11_CR27","doi-asserted-by":"crossref","unstructured":"Xie, Z., Huang, Y., Zhu, Y., Jin, L., Liu, Y., Xie, L.: Aggregation cross-entropy for sequence recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 6538\u20136547 (2019)","DOI":"10.1109\/CVPR.2019.00670"}],"container-title":["Lecture Notes in Computer Science","Image and Graphics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-46311-2_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,10,28]],"date-time":"2023-10-28T19:03:25Z","timestamp":1698519805000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-46311-2_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031463105","9783031463112"],"references-count":27,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-46311-2_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"29 October 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICIG","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Image and Graphics","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Nanjing","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"China","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"22 September 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24 September 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"12","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icig2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/icig2023.csig.org.cn\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Conference Management Toolkit","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"409","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"166","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"41% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}