{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,2]],"date-time":"2026-01-02T07:48:12Z","timestamp":1767340092341,"version":"3.37.3"},"reference-count":39,"publisher":"Springer Science and Business Media LLC","issue":"3","license":[{"start":{"date-parts":[[2019,7,2]],"date-time":"2019-07-02T00:00:00Z","timestamp":1562025600000},"content-version":"tdm","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2019,7,2]],"date-time":"2019-07-02T00:00:00Z","timestamp":1562025600000},"content-version":"vor","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"crossref","award":["U1636124"],"award-info":[{"award-number":["U1636124"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"crossref"}]}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["IJDAR"],"published-print":{"date-parts":[[2019,9]]},"DOI":"10.1007\/s10032-019-00328-x","type":"journal-article","created":{"date-parts":[[2019,7,2]],"date-time":"2019-07-02T18:10:31Z","timestamp":1562091031000},"page":"235-246","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":7,"title":["Dynamic temporal residual network for sequence modeling"],"prefix":"10.1007","volume":"22","author":[{"given":"Ruijie","family":"Yan","sequence":"first","affiliation":[]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7793-1039","authenticated-orcid":false,"given":"Liangrui","family":"Peng","sequence":"additional","affiliation":[]},{"given":"Shanyu","family":"Xiao","sequence":"additional","affiliation":[]},{"given":"Michael T.","family":"Johnson","sequence":"additional","affiliation":[]},{"given":"Shengjin","family":"Wang","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2019,7,2]]},"reference":[{"issue":"3","key":"328_CR1","doi-asserted-by":"publisher","first-page":"275","DOI":"10.1007\/s10032-014-0218-7","volume":"17","author":"GA Abandah","year":"2014","unstructured":"Abandah, G.A., Jamour, F.T., Qaralleh, E.A.: Recognizing handwritten Arabic words using grapheme segmentation and recurrent neural networks. Int. J. Doc. Anal. Recognit. 17(3), 275\u2013291 (2014)","journal-title":"Int. J. Doc. Anal. Recognit."},{"key":"328_CR2","unstructured":"Amodei, D., Ananthanarayanan, S., Anubhai, R., Bai, J., Battenberg, E., Case, C., Casper, J., Catanzaro, B., Cheng, Q., Chen, G., et al.: Deep speech 2: end-to-end speech recognition in English and Mandarin. In: Proceedings of the International Conference on Machine Learning, pp. 173\u2013182 (2016)"},{"key":"328_CR3","doi-asserted-by":"crossref","unstructured":"Bluche, T., Louradour, J., Messina, R.: Scan, attend and read: end-to-end handwritten paragraph recognition with MDLSTM attention. In: Proceedings of the International Conference on Document Analysis and Recognition, vol. 1, pp. 1050\u20131055 (2017)","DOI":"10.1109\/ICDAR.2017.174"},{"key":"328_CR4","unstructured":"Chang, S., Zhang, Y., Han, W., Yu, M., Guo, X., Tan, W., Cui, X., Witbrock, M., Hasegawa-Johnson, M.A., Huang, T.S.: Dilated recurrent neural networks. In: Advances in Neural Information Processing Systems, pp. 77\u201387 (2017)"},{"issue":"7","key":"328_CR5","doi-asserted-by":"publisher","first-page":"1185","DOI":"10.1109\/TASLP.2016.2539499","volume":"24","author":"K Chen","year":"2016","unstructured":"Chen, K., Huo, Q.: Training deep bidirectional LSTM acoustic model for LVCSR by a context-sensitive-chunk BPTT approach. IEEE Trans. Audio Speech Lang. Process. 24(7), 1185\u20131193 (2016)","journal-title":"IEEE Trans. Audio Speech Lang. Process."},{"key":"328_CR6","unstructured":"Chorowski, J., Jaitly, N.: Towards better decoding and language model integration in sequence to sequence models (2016). arXiv preprint \n                    arXiv:1612.02695"},{"issue":"4","key":"328_CR7","doi-asserted-by":"publisher","first-page":"357","DOI":"10.1109\/TASSP.1980.1163420","volume":"28","author":"S Davis","year":"1980","unstructured":"Davis, S., Mermelstein, P.: Comparison of parametric representations for monosyllabic word recognition in continuously spoken sentences. IEEE Trans. Acoust. Speech Signal Process. 28(4), 357\u2013366 (1980)","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"key":"328_CR8","doi-asserted-by":"crossref","unstructured":"Ding, H., Chen, K., Yuan, Y., Cai, M., Sun, L., Liang, S., Huo, Q.: A compact CNN-DBLSTM based character model for offline handwriting recognition with Tucker decomposition. In: Proceedings of the International Conference on Document Analysis and Recognition, pp. 507\u2013512 (2017)","DOI":"10.1109\/ICDAR.2017.89"},{"issue":"2","key":"328_CR9","doi-asserted-by":"publisher","first-page":"179","DOI":"10.1207\/s15516709cog1402_1","volume":"14","author":"JL Elman","year":"1990","unstructured":"Elman, J.L.: Finding structure in time. Cognit. Sci. 14(2), 179\u2013211 (1990)","journal-title":"Cognit. Sci."},{"key":"328_CR10","doi-asserted-by":"crossref","unstructured":"Garofolo, J.S., Lamel, L.F., Fisher, W.M., Fiscus, J.G., Pallett, D.S., Dahlgren, N.L.: DARPA TIMIT acoustic-phonetic continuous speech corpus CD-ROM. NIST speech disc 1-1.1. NASA STI\/Recon technical report 93 (1993)","DOI":"10.6028\/NIST.IR.4930"},{"key":"328_CR11","doi-asserted-by":"crossref","unstructured":"Graves, A.: Connectionist temporal classification. In: Supervised Sequence Labelling with Recurrent Neural Networks, pp. 5\u201313. Springer (2012)","DOI":"10.1007\/978-3-642-24797-2_2"},{"key":"328_CR12","doi-asserted-by":"crossref","unstructured":"Graves, A.: Offline Arabic handwriting recognition with multidimensional recurrent neural networks. In: Guide to OCR for Arabic Scripts, pp. 297\u2013313. Springer (2012)","DOI":"10.1007\/978-1-4471-4072-6_12"},{"key":"328_CR13","doi-asserted-by":"crossref","unstructured":"Graves, A., Mohamed, A., Hinton, G.: Speech recognition with deep recurrent neural networks. In: Proceedings of the International Conference on Acoustics, Speech and Signal Processing, pp. 6645\u20136649 (2013)","DOI":"10.1109\/ICASSP.2013.6638947"},{"key":"328_CR14","doi-asserted-by":"crossref","unstructured":"Grosicki, E., Carre, M., Brodin, J.M., Geoffrois, E.: RIMES evaluation campaign for handwritten mail processing. In: Proceedings of the International Conference on Frontiers in Handwriting Recognition, pp. 1\u20136 (2008)","DOI":"10.1109\/ICDAR.2009.224"},{"key":"328_CR15","unstructured":"Gui, T., Zhang, Q., Zhao, L., Lin, Y., Peng, M., Gong, J., Huang, X.: Long short-term memory with dynamic skip connections (2018). arXiv preprint \n                    arXiv:1811.03873"},{"key":"328_CR16","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"issue":"2","key":"328_CR17","doi-asserted-by":"publisher","first-page":"107","DOI":"10.1142\/S0218488598000094","volume":"6","author":"S Hochreiter","year":"1998","unstructured":"Hochreiter, S.: The vanishing gradient problem during learning recurrent neural nets and problem solutions. Int. J. Uncertain. Fuzziness Knowl. Based Syst. 6(2), 107\u2013116 (1998)","journal-title":"Int. J. Uncertain. Fuzziness Knowl. Based Syst."},{"issue":"8","key":"328_CR18","doi-asserted-by":"publisher","first-page":"1735","DOI":"10.1162\/neco.1997.9.8.1735","volume":"9","author":"S Hochreiter","year":"1997","unstructured":"Hochreiter, S., Schmidhuber, J.: Long short-term memory. Neural Comput. 9(8), 1735\u20131780 (1997)","journal-title":"Neural Comput."},{"key":"328_CR19","doi-asserted-by":"crossref","unstructured":"Hu, W., Cai, M., Chen, K., Ding, H., Sun, L., Liang, S., Mo, X., Huo, Q.: Sequence discriminative training for offline handwriting recognition by an interpolated CTC and lattice-free MMI objective function. In: Proceedings of the International Conference on Document Analysis and Recognition, pp. 61\u201366 (2017)","DOI":"10.1109\/ICDAR.2017.19"},{"key":"328_CR20","unstructured":"Ioffe, S., Szegedy, C.: Batch normalization: Accelerating deep network training by reducing internal covariate shift (2015). arXiv preprint \n                    arXiv:1502.03167"},{"issue":"11","key":"328_CR21","doi-asserted-by":"publisher","first-page":"1641","DOI":"10.1109\/29.46546","volume":"37","author":"KF Lee","year":"1989","unstructured":"Lee, K.F., Hon, H.W.: Speaker-independent phone recognition using hidden Markov models. IEEE Trans. Acoust. Speech Signal Process. 37(11), 1641\u20131648 (1989)","journal-title":"IEEE Trans. Acoust. Speech Signal Process."},{"issue":"1","key":"328_CR22","doi-asserted-by":"publisher","first-page":"39","DOI":"10.1007\/s100320200071","volume":"5","author":"U Marti","year":"2002","unstructured":"Marti, U., Bunke, H.: The IAM-database: an English sentence database for offline handwriting recognition. Int. J. Doc. Anal. Recognit. 5(1), 39\u201346 (2002)","journal-title":"Int. J. Doc. Anal. Recognit."},{"key":"328_CR23","doi-asserted-by":"crossref","unstructured":"Menasri, F., Louradour, J., Bianne-Bernard, A.L., Kermorvant, C.: The A2iA French handwriting recognition system at the Rimes-ICDAR2011 competition. In: Proceedings of Document Recognition and Retrieval, p. 8297Y (2012)","DOI":"10.1117\/12.911981"},{"key":"328_CR24","unstructured":"Pascanu, R., Gulcehre, C., Cho, K., Bengio, Y.: How to construct deep recurrent neural networks (2013). arXiv preprint \n                    arXiv:1312.6026"},{"key":"328_CR25","unstructured":"Paszke, A., Gross, S., Soumith, C., et. al.: Automatic differentiation in PyTorch. In: NIPS 2017 Autodiff Workshop (2017)"},{"key":"328_CR26","unstructured":"Pechwitz, M., Maddouri, S.S., M\u00e4rgner, V., Ellouze, N., Amiri, H., et al.: IFN\/ENIT-database of handwritten Arabic words. In: Proceedings of the Colloque International Francophone sur l\u2019Ecrit et le Document, vol. 2, pp. 127\u2013136 (2002)"},{"key":"328_CR27","doi-asserted-by":"crossref","unstructured":"Pei, W., Baltrusaitis, T., Tax, D.M., Morency, L.P.: Temporal attention-gated model for robust sequence classification. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 820\u2013829 (2017)","DOI":"10.1109\/CVPR.2017.94"},{"key":"328_CR28","doi-asserted-by":"crossref","unstructured":"Pham, V., Bluche, T., Kermorvant, C., Louradour, J.: Dropout improves recurrent neural networks for handwriting recognition. In: Proceedings of the International Conference on Frontiers in Handwriting Recognition, pp. 285\u2013290 (2014)","DOI":"10.1109\/ICFHR.2014.55"},{"key":"328_CR29","doi-asserted-by":"crossref","unstructured":"Puigcerver, J.: Are multidimensional recurrent layers really necessary for handwritten text recognition? In: Proceedings of the International Conference on Document Analysis and Recognition, pp. 67\u201372 (2017)","DOI":"10.1109\/ICDAR.2017.20"},{"key":"328_CR30","unstructured":"Puigcerver, J., Martin-Albo, D., Villegas, M.: Laia: a deep learning toolkit for HTR. \n                    https:\/\/github.com\/jpuigcerver\/Laia\n                    \n                   (2016). GitHub repository"},{"issue":"11","key":"328_CR31","doi-asserted-by":"publisher","first-page":"2298","DOI":"10.1109\/TPAMI.2016.2646371","volume":"39","author":"B Shi","year":"2017","unstructured":"Shi, B., Bai, X., Yao, C.: An end-to-end trainable neural network for image-based sequence recognition and its application to scene text recognition. IEEE Trans. Pattern Anal. Mach. Intell. 39(11), 2298\u20132304 (2017)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"328_CR32","unstructured":"Srivastava, R.K., Greff, K., Schmidhuber, J.: Highway networks (2015). arXiv preprint \n                    arXiv:1505.00387"},{"key":"328_CR33","unstructured":"Tieleman, T., Hinton, G.: Lecture 6.5-RmsProp: divide the gradient by a running average of its recent magnitude. In: COURSERA: Neural Networks for Machine Learning (2012)"},{"key":"328_CR34","unstructured":"Vaswani, A., Shazeer, N., Parmar, N., Uszkoreit, J., Jones, L., Gomez, A.N., Kaiser, \u0141., Polosukhin, I.: Attention is all you need. In: Advances in Neural Information Processing Systems, pp. 5998\u20136008 (2017)"},{"key":"328_CR35","unstructured":"Wu, Y., Schuster, M., Chen, Z., et\u00a0al.: Google\u2019s neural machine translation system: bridging the gap between human and machine translation (2016). arXiv preprint \n                    arXiv:1609.08144"},{"key":"328_CR36","doi-asserted-by":"crossref","unstructured":"Wu, Y.C., Yin, F., Chen, Z., Liu, C.L.: Handwritten Chinese text recognition using separable multi-dimensional recurrent neural network. In: Proceedings of the International Conference on Document Analysis and Recognition, pp. 79\u201384 (2017)","DOI":"10.1109\/ICDAR.2017.22"},{"key":"328_CR37","doi-asserted-by":"crossref","unstructured":"Yousefi, M.R., Soheili, M.R., Breuel, T.M., Stricker, D.: A comparison of 1D and 2D LSTM architectures for the recognition of handwritten Arabic. In: Proceedings of Document Recognition and Retrieval, p. 94020H (2015)","DOI":"10.1117\/12.2075930"},{"issue":"3","key":"328_CR38","doi-asserted-by":"publisher","first-page":"56","DOI":"10.3390\/info9030056","volume":"9","author":"B Yue","year":"2018","unstructured":"Yue, B., Fu, J., Liang, J.: Residual recurrent neural networks for learning sequential representations. Information 9(3), 56 (2018)","journal-title":"Information"},{"key":"328_CR39","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Chen, G., Yu, D., Yaco, K., Khudanpur, S., Glass, J.: Highway long short-term memory RNNs for distant speech recognition. In: Proceedings of the International Conference on Acoustics, Speech and Signal Processing, pp. 5755\u20135759 (2016)","DOI":"10.1109\/ICASSP.2016.7472780"}],"container-title":["International Journal on Document Analysis and Recognition (IJDAR)"],"original-title":[],"language":"en","link":[{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10032-019-00328-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/article\/10.1007\/s10032-019-00328-x\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"http:\/\/link.springer.com\/content\/pdf\/10.1007\/s10032-019-00328-x.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2020,6,30]],"date-time":"2020-06-30T23:59:39Z","timestamp":1593561579000},"score":1,"resource":{"primary":{"URL":"http:\/\/link.springer.com\/10.1007\/s10032-019-00328-x"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2019,7,2]]},"references-count":39,"journal-issue":{"issue":"3","published-print":{"date-parts":[[2019,9]]}},"alternative-id":["328"],"URL":"https:\/\/doi.org\/10.1007\/s10032-019-00328-x","relation":{},"ISSN":["1433-2833","1433-2825"],"issn-type":[{"type":"print","value":"1433-2833"},{"type":"electronic","value":"1433-2825"}],"subject":[],"published":{"date-parts":[[2019,7,2]]},"assertion":[{"value":"16 November 2018","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"15 April 2019","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"11 June 2019","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"2 July 2019","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}]}}