{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T05:59:02Z","timestamp":1777615142196,"version":"3.51.4"},"publisher-location":"Cham","reference-count":43,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031416842","type":"print"},{"value":"9783031416859","type":"electronic"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-41685-9_14","type":"book-chapter","created":{"date-parts":[[2023,8,18]],"date-time":"2023-08-18T14:04:59Z","timestamp":1692367499000},"page":"217-235","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":2,"title":["DSS: Synthesizing Long Digital Ink Using Data Augmentation, Style Encoding and\u00a0Split Generation"],"prefix":"10.1007","author":[{"given":"Aleksandr","family":"Timofeev","sequence":"first","affiliation":[]},{"given":"Anastasiia","family":"Fadeeva","sequence":"additional","affiliation":[]},{"given":"Andrei","family":"Afonin","sequence":"additional","affiliation":[]},{"given":"Claudiu","family":"Musat","sequence":"additional","affiliation":[]},{"given":"Andrii","family":"Maksai","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,8,19]]},"reference":[{"key":"14_CR1","doi-asserted-by":"crossref","unstructured":"Aksan, E., Pece, F., Hilliges, O.: DeepWriting: Making Digital Ink Editable via Deep Generative Modeling. In: SIGCHI Conference on Human Factors in Computing Systems. CHI 2018, New York, NY, USA. ACM (2018)","DOI":"10.1145\/3173574.3173779"},{"key":"14_CR2","doi-asserted-by":"crossref","unstructured":"Alonso, E., Moysset, B., Messina, R.O.: Adversarial generation of handwritten text images conditioned on sequences. In: 2019 International Conference on Document Analysis and Recognition (ICDAR), pp. 481\u2013486 (2019)","DOI":"10.1109\/ICDAR.2019.00083"},{"key":"14_CR3","unstructured":"Anil, C., et al.: Exploring length generalization in large language models. In: Oh, A.H., Agarwal, A., Belgrave, D., Cho, K. (eds.) Advances in Neural Information Processing Systems (2022). https:\/\/openreview.net\/forum?id=zSkYVeX7bC4"},{"key":"14_CR4","unstructured":"Bengio, S., Vinyals, O., Jaitly, N., Shazeer, N.M.: Scheduled sampling for sequence prediction with recurrent neural networks. arXiv:abs\/1506.03099 (2015)"},{"key":"14_CR5","unstructured":"Bishop, C.M.: Mixture density networks (1994)"},{"key":"14_CR6","doi-asserted-by":"publisher","first-page":"89","DOI":"10.1007\/s10032-020-00350-4","volume":"23","author":"V Carbune","year":"2020","unstructured":"Carbune, V., et al.: Fast multi-language LSTM-based online handwriting recognition. Int. J. Doc. Anal. Recogn. (IJDAR) 23, 89\u2013102 (2020)","journal-title":"Int. J. Doc. Anal. Recogn. (IJDAR)"},{"key":"14_CR7","unstructured":"Chang, J.H.R., Shrivastava, A., Koppula, H.S., Zhang, X., Tuzel, O.: Style equalization: Unsupervised learning of controllable generative sequence models (2022). https:\/\/arxiv.org\/abs\/2110.02891"},{"key":"14_CR8","unstructured":"Chen, T., Kornblith, S., Norouzi, M., Hinton, G.: A simple framework for contrastive learning of visual representations (2020)"},{"key":"14_CR9","doi-asserted-by":"publisher","unstructured":"Chiu, C.C., et al.: RNN-T models fail to generalize to out-of-domain audio: causes and solutions, pp. 873\u2013880 (2021). https:\/\/doi.org\/10.1109\/SLT48900.2021.9383518","DOI":"10.1109\/SLT48900.2021.9383518"},{"key":"14_CR10","doi-asserted-by":"publisher","unstructured":"Dai, Z., Yang, Z., Yang, Y., Carbonell, J., Le, Q.V., Salakhutdinov, R.: Transformer-xl: attentive language models beyond a fixed-length context (2019). https:\/\/doi.org\/10.48550\/ARXIV.1901.02860, https:\/\/arxiv.org\/abs\/1901.02860","DOI":"10.48550\/ARXIV.1901.02860"},{"key":"14_CR11","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"632","DOI":"10.1007\/978-3-030-58574-7_38","volume-title":"Computer Vision \u2013 ECCV 2020","author":"A Das","year":"2020","unstructured":"Das, A., Yang, Y., Hospedales, T., Xiang, T., Song, Y.-Z.: B\u00e9zierSketch: a generative model for scalable vector sketches. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12371, pp. 632\u2013647. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58574-7_38"},{"key":"14_CR12","doi-asserted-by":"crossref","unstructured":"Djioua, M., Plamondon, R.: An interactive system for the automatic generation of huge handwriting databases from a few specimens. In: 2008 19th International Conference on Pattern Recognition, pp. 1\u20134 (2008)","DOI":"10.1109\/ICPR.2008.4761931"},{"issue":"4","key":"14_CR13","doi-asserted-by":"publisher","first-page":"455","DOI":"10.1007\/s10032-014-0231-x","volume":"17","author":"Y Elarian","year":"2014","unstructured":"Elarian, Y., Abdel-Aal, R., Ahmad, I., Parvez, M.T., Zidouri, A.: Handwriting synthesis: classifications and techniques. Int. J. Document Anal. Recogn. (IJDAR) 17(4), 455\u2013469 (2014). https:\/\/doi.org\/10.1007\/s10032-014-0231-x","journal-title":"Int. J. Document Anal. Recogn. (IJDAR)"},{"key":"14_CR14","doi-asserted-by":"crossref","unstructured":"Fisher, R.A.: On the interpretation of from contingency tables, and the calculation of p. J. Roy. Stat. Soc. 85 (1922). http:\/\/www.medicine.mcgill.ca","DOI":"10.2307\/2340521"},{"key":"14_CR15","doi-asserted-by":"crossref","unstructured":"Gan, J., Wang, W.: HIGAN: handwriting imitation conditioned on arbitrary-length texts and disentangled styles. In: AAAI Conference on Artificial Intelligence (2021)","DOI":"10.1609\/aaai.v35i9.16917"},{"key":"14_CR16","unstructured":"Graves, A.: Generating sequences with recurrent neural networks. arXiv:abs\/1308.0850 (2013)"},{"key":"14_CR17","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J.: Long short-term memory. Neural Comput. 9, 1735\u201380 (1997). https:\/\/doi.org\/10.1162\/neco.1997.9.8.1735","journal-title":"Neural Comput."},{"key":"14_CR18","doi-asserted-by":"publisher","unstructured":"Hsu, W.N., et al.: Disentangling correlated speaker and noise for speech synthesis via data augmentation and adversarial factorization. In: ICASSP 2019\u20132019 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 5901\u20135905 (2019). https:\/\/doi.org\/10.1109\/ICASSP.2019.8683561","DOI":"10.1109\/ICASSP.2019.8683561"},{"key":"14_CR19","doi-asserted-by":"crossref","unstructured":"Huber, C., Hussain, J., St\u00fcker, S., Waibel, A.H.: Instant one-shot word-learning for context-specific neural sequence-to-sequence speech recognition. In: 2021 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU), pp. 1\u20137 (2021)","DOI":"10.1109\/ASRU51503.2021.9687898"},{"key":"14_CR20","doi-asserted-by":"crossref","unstructured":"Inderm\u00fchle, E., Liwicki, M., Bunke, H.: Iamondo-database: an online handwritten document database with non-uniform contents. In: International Workshop on Document Analysis Systems (2010)","DOI":"10.1145\/1815330.1815343"},{"key":"14_CR21","unstructured":"Ke, G., He, D., Liu, T.Y.: Rethinking the positional encoding in language pre-training (2020)"},{"key":"14_CR22","doi-asserted-by":"publisher","unstructured":"Koehn, P., Knowles, R.: Six challenges for neural machine translation. In: Proceedings of the First Workshop on Neural Machine Translation, Vancouver, August 2017, pp. 28\u201339. Association for Computational Linguistics (2017). https:\/\/doi.org\/10.18653\/v1\/W17-3204, https:\/\/aclanthology.org\/W17-3204","DOI":"10.18653\/v1\/W17-3204"},{"key":"14_CR23","doi-asserted-by":"publisher","unstructured":"Kondo, S., Hotate, K., Hirasawa, T., Kaneko, M., Komachi, M.: Sentence concatenation approach to data augmentation for neural machine translation, pp. 143\u2013149 (2021). https:\/\/doi.org\/10.18653\/v1\/2021.naacl-srw.18","DOI":"10.18653\/v1\/2021.naacl-srw.18"},{"key":"14_CR24","doi-asserted-by":"publisher","first-page":"387","DOI":"10.1007\/s10032-019-00336-x","volume":"22","author":"P Krishnan","year":"2019","unstructured":"Krishnan, P., Jawahar, C.: HWNET v2: an efficient word image representation for handwritten documents. Int. J. Doc. Anal. Recogn. (IJDAR) 22, 387\u2013405 (2019)","journal-title":"Int. J. Doc. Anal. Recogn. (IJDAR)"},{"key":"14_CR25","unstructured":"Lamb, A., Goyal, A., Zhang, Y., Zhang, S., Courville, A., Bengio, Y.: Professor forcing: a new algorithm for training recurrent networks (2016)"},{"key":"14_CR26","doi-asserted-by":"publisher","unstructured":"Lin, Z., Wan, L.: Style-preserving English handwriting synthesis. Pattern Recogn. 40(7), 2097\u20132109 (2007). https:\/\/doi.org\/10.1016\/j.patcog.2006.11.024, https:\/\/www.sciencedirect.com\/science\/article\/pii\/S0031320306004985","DOI":"10.1016\/j.patcog.2006.11.024"},{"key":"14_CR27","doi-asserted-by":"publisher","unstructured":"Liwicki, M., Bunke, H.: Iam-ondb - an on-line English sentence database acquired from handwritten text on a whiteboard. In: Eighth International Conference on Document Analysis and Recognition (ICDAR 2005), vol. 2, pp. 956\u2013961 (2005). https:\/\/doi.org\/10.1109\/ICDAR.2005.132","DOI":"10.1109\/ICDAR.2005.132"},{"key":"14_CR28","unstructured":"Lu, Z., et al.: Input length matters: improving RNN-T and MWER training for long-form telephony speech recognition (2021)"},{"key":"14_CR29","doi-asserted-by":"publisher","unstructured":"Luo, C., Zhu, Y., Jin, L., Li, Z., Peng, D.: Slogan: Handwriting style synthesis for arbitrary-length and out-of-vocabulary text (2022). https:\/\/doi.org\/10.48550\/ARXIV.2202.11456, https:\/\/arxiv.org\/abs\/2202.11456","DOI":"10.48550\/ARXIV.2202.11456"},{"key":"14_CR30","unstructured":"Maksai, A., Rowley, H., Berent, J., Musat, C.: INKORRECT: online handwriting spelling correction (2022)"},{"key":"14_CR31","doi-asserted-by":"publisher","unstructured":"Nallapati, R., Zhou, B., dos Santos, C., Gulcehre, C., Xiang, B.: Abstractive text summarization using sequence-to-sequence RNNs and beyond. In: Proceedings of the 20th SIGNLL Conference on Computational Natural Language Learning, Berlin, Germany, August 2016, pp. 280\u2013290. Association for Computational Linguistics (2016). https:\/\/doi.org\/10.18653\/v1\/K16-1028, https:\/\/aclanthology.org\/K16-1028","DOI":"10.18653\/v1\/K16-1028"},{"key":"14_CR32","doi-asserted-by":"publisher","unstructured":"Narayanan, A., Prabhavalkar, R., Chiu, C.C., Rybach, D., Sainath, T.N., Strohman, T.: Recognizing long-form speech using streaming end-to-end models. In: 2019 IEEE Automatic Speech Recognition and Understanding Workshop (ASRU), pp. 920\u2013927 (2019). https:\/\/doi.org\/10.1109\/ASRU46091.2019.9003913","DOI":"10.1109\/ASRU46091.2019.9003913"},{"key":"14_CR33","doi-asserted-by":"publisher","unstructured":"Neishi, M., Yoshinaga, N.: On the relation between position information and sentence length in neural machine translation. In: Proceedings of the 23rd Conference on Computational Natural Language Learning (CoNLL), Hong Kong, China, November 2019, pp. 328\u2013338. Association for Computational Linguistics (2019). https:\/\/doi.org\/10.18653\/v1\/K19-1031, https:\/\/aclanthology.org\/K19-1031","DOI":"10.18653\/v1\/K19-1031"},{"key":"14_CR34","doi-asserted-by":"crossref","unstructured":"Nguyen, H., Nguyen, C., Bao, P., Nakagawa, M.: A database of unconstrained vietnamese online handwriting and recognition experiments by recurrent neural networks. Pattern Recogn. 78, 291\u2013306 (2018)","DOI":"10.1016\/j.patcog.2018.01.013"},{"key":"14_CR35","doi-asserted-by":"publisher","unstructured":"Pechwitz, M., Margner, V.: Baseline estimation for Arabic handwritten words. In: Proceedings Eighth International Workshop on Frontiers in Handwriting Recognition, pp. 479\u2013484 (2002). https:\/\/doi.org\/10.1109\/IWFHR.2002.1030956","DOI":"10.1109\/IWFHR.2002.1030956"},{"key":"14_CR36","doi-asserted-by":"publisher","unstructured":"Raffel, C., et al.: Exploring the limits of transfer learning with a unified text-to-text transformer (2019). https:\/\/doi.org\/10.48550\/ARXIV.1910.10683, https:\/\/arxiv.org\/abs\/1910.10683","DOI":"10.48550\/ARXIV.1910.10683"},{"key":"14_CR37","doi-asserted-by":"publisher","unstructured":"Ribeiro, L.S.F., Bui, T., Collomosse, J., Ponti, M.: Sketchformer: Transformer-based representation for sketched structure (2020). https:\/\/doi.org\/10.48550\/ARXIV.2002.10381, https:\/\/arxiv.org\/abs\/2002.10381","DOI":"10.48550\/ARXIV.2002.10381"},{"key":"14_CR38","doi-asserted-by":"publisher","unstructured":"Schaldenbrand, P., Liu, Z., Oh, J.: Styleclipdraw: Coupling content and style in text-to-drawing translation (2022). https:\/\/doi.org\/10.48550\/ARXIV.2202.12362, https:\/\/arxiv.org\/abs\/2202.12362","DOI":"10.48550\/ARXIV.2202.12362"},{"key":"14_CR39","unstructured":"Sutskever, I., Vinyals, O., Le, Q.V.: Sequence to sequence learning with neural networks. In: Proceedings of the 27th International Conference on Neural Information Processing Systems. NIPS 2014, Cambridge, MA, USA, vol. 2, pp. 3104\u20133112. MIT Press (2014)"},{"key":"14_CR40","unstructured":"Thoppilan, R., et al.: LAMDA: language models for dialog applications (2022)"},{"key":"14_CR41","doi-asserted-by":"publisher","unstructured":"Varis, D., Bojar, O.: Sequence length is a domain: length-based overfitting in transformer models, pp. 8246\u20138257 (2021). https:\/\/doi.org\/10.18653\/v1\/2021.emnlp-main.650","DOI":"10.18653\/v1\/2021.emnlp-main.650"},{"key":"14_CR42","unstructured":"Vaswani, A., et al.: Attention is all you need. In: Guyon, I., et al. (eds.) Advances in Neural Information Processing Systems, vol. 30. Curran Associates, Inc. (2017), https:\/\/proceedings.neurips.cc\/paper\/2017\/file\/3f5ee243547dee91fbd053c1c4a845aa-Paper.pdf"},{"key":"14_CR43","doi-asserted-by":"publisher","unstructured":"Zhang, J.X., Ling, Z.H., Dai, L.R.: Forward attention in sequence- to-sequence acoustic modeling for speech synthesis. In: 2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP), pp. 4789\u20134793 (2018). https:\/\/doi.org\/10.1109\/ICASSP.2018.8462020","DOI":"10.1109\/ICASSP.2018.8462020"}],"container-title":["Lecture Notes in Computer Science","Document Analysis and Recognition - ICDAR 2023"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-41685-9_14","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,18]],"date-time":"2023-08-18T14:08:47Z","timestamp":1692367727000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-41685-9_14"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031416842","9783031416859"],"references-count":43,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-41685-9_14","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"19 August 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ICDAR","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Document Analysis and Recognition","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"San Jos\u00e9, CA","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"USA","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"21 August 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"26 August 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"icdar2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/icdar2023.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Easychair","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"316","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"154","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"49% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2.89","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1.50","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"No","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Number and type of other papers accepted : IJDAR track papers","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}