{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,20]],"date-time":"2026-03-20T16:59:42Z","timestamp":1774025982864,"version":"3.50.1"},"reference-count":73,"publisher":"Springer Science and Business Media LLC","issue":"8","license":[{"start":{"date-parts":[[2024,7,22]],"date-time":"2024-07-22T00:00:00Z","timestamp":1721606400000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,7,22]],"date-time":"2024-07-22T00:00:00Z","timestamp":1721606400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Sci. China Inf. Sci."],"published-print":{"date-parts":[[2024,8]]},"DOI":"10.1007\/s11432-022-3859-8","type":"journal-article","created":{"date-parts":[[2024,7,24]],"date-time":"2024-07-24T11:10:19Z","timestamp":1721819419000},"update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["SeeMore: a spatiotemporal predictive model with bidirectional distillation and level-specific meta-adaptation"],"prefix":"10.1007","volume":"67","author":[{"given":"Yuqing","family":"Ma","sequence":"first","affiliation":[]},{"given":"Wei","family":"Liu","sequence":"additional","affiliation":[]},{"given":"Yajun","family":"Gao","sequence":"additional","affiliation":[]},{"given":"Yang","family":"Yuan","sequence":"additional","affiliation":[]},{"given":"Shihao","family":"Bai","sequence":"additional","affiliation":[]},{"given":"Haotong","family":"Qin","sequence":"additional","affiliation":[]},{"given":"Xianglong","family":"Liu","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,7,22]]},"reference":[{"key":"3859_CR1","doi-asserted-by":"publisher","first-page":"1106","DOI":"10.1007\/s11263-018-01144-2","volume":"127","author":"T F Xue","year":"2019","unstructured":"Xue T F, Chen B A, Wu J J, et al. Video enhancement with task-oriented flow. Int J Comput Vis, 2019, 127: 1106\u20131125","journal-title":"Int J Comput Vis"},{"key":"3859_CR2","doi-asserted-by":"crossref","unstructured":"Park J, Lee C, Kim C. Asymmetric bilateral motion estimation for video frame interpolation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, Montreal, 2021. 14519\u201314528","DOI":"10.1109\/ICCV48922.2021.01427"},{"key":"3859_CR3","doi-asserted-by":"crossref","unstructured":"Li H P, Yuan Y, Wang Q. Video frame interpolation via residue refinement. In: Proceedings of the IEEE International Conference on Acoustics, Speech and Signal Processing, Barcelona, 2020. 2613\u20132617","DOI":"10.1109\/ICASSP40776.2020.9053987"},{"key":"3859_CR4","unstructured":"Shi X J, Chen Z R, Wang H, et al. Convolutional LSTM network: a machine learning approach for precipitation nowcasting. In: Proceedings of the Advances in Neural Information Processing Systems, Montreal, 2015. 802\u2013810"},{"key":"3859_CR5","doi-asserted-by":"crossref","unstructured":"Wang Y B, Zhang J J, Zhu H Y, et al. Memory in memory: a predictive neural network for learning higher-order non-stationarity from spatiotemporal dynamics. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, Long Beach, 2019. 9154\u20139162","DOI":"10.1109\/CVPR.2019.00937"},{"key":"3859_CR6","doi-asserted-by":"publisher","first-page":"2208","DOI":"10.1109\/TPAMI.2022.3165153","volume":"45","author":"Y B Wang","year":"2023","unstructured":"Wang Y B, Wu H X, Zhang J J, et al. PredRNN: a recurrent neural network for spatiotemporal predictive learning. IEEE Trans Pattern Anal Mach Intell, 2023, 45: 2208\u20132225","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"3859_CR7","doi-asserted-by":"publisher","first-page":"212207","DOI":"10.1007\/s11432-019-2761-y","volume":"63","author":"G Xie","year":"2020","unstructured":"Xie G, Shangguan A Q, Fei R, et al. Motion trajectory prediction based on a CNN-LSTM sequential model. Sci China Inf Sci, 2020, 63: 212207","journal-title":"Sci China Inf Sci"},{"key":"3859_CR8","doi-asserted-by":"publisher","first-page":"172207","DOI":"10.1007\/s11432-020-3071-8","volume":"64","author":"H B Gao","year":"2021","unstructured":"Gao H B, Su H, Cai Y F, et al. Trajectory prediction of cyclist based on dynamic Bayesian network and long short-term memory model at unsignalized intersections. Sci China Inf Sci, 2021, 64: 172207","journal-title":"Sci China Inf Sci"},{"key":"3859_CR9","doi-asserted-by":"crossref","unstructured":"Zhao H, Wildes R P. Where are you heading? Dynamic trajectory prediction with expert goal examples. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, Montreal, 2021. 7609\u20137618","DOI":"10.1109\/ICCV48922.2021.00753"},{"key":"3859_CR10","doi-asserted-by":"publisher","first-page":"2716","DOI":"10.1109\/LRA.2022.3145090","volume":"7","author":"C H Wang","year":"2022","unstructured":"Wang C H, Wang Y C, Xu M Z, et al. Stepwise goal-driven networks for trajectory prediction. IEEE Robot Autom Lett, 2022, 7: 2716\u20132723","journal-title":"IEEE Robot Autom Lett"},{"key":"3859_CR11","doi-asserted-by":"crossref","unstructured":"Liang R, Li Y, Li X, et al. Temporal pyramid network for pedestrian trajectory prediction with multi-supervision. In: Proceedings of the 35th AAAI Conference on Artificial Intelligence, the 33rd Conference on Innovative Applications of Artificial Intelligence, the 11th Symposium on Educational Advances in Artificial Intelligence, Virtual Event, 2021. 2029\u20132037","DOI":"10.1609\/aaai.v35i3.16299"},{"key":"3859_CR12","doi-asserted-by":"crossref","unstructured":"Codevilla F, Santana E, Lopez A M, et al. Exploring the limitations of behavior cloning for autonomous driving. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, Seoul, 2019. 9328\u20139337","DOI":"10.1109\/ICCV.2019.00942"},{"key":"3859_CR13","doi-asserted-by":"crossref","unstructured":"Chen D, Koltun V, Kr\u00e4henb\u00fchl P. Learning to drive from a world on rails. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, Montreal, 2021. 15570\u201315579","DOI":"10.1109\/ICCV48922.2021.01530"},{"key":"3859_CR14","doi-asserted-by":"crossref","unstructured":"Chitta K, Prakash A, Geiger A. NEAT: neural attention fields for end-to-end autonomous driving. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, Montreal, 2021. 15773\u201315783","DOI":"10.1109\/ICCV48922.2021.01550"},{"key":"3859_CR15","unstructured":"Wang Y B, Jiang L, Yang M, et al. Eidetic 3D LSTM: a model for video prediction and beyond. In: Proceedings of the 7th International Conference on Learning Representations, New Orleans, 2019"},{"key":"3859_CR16","unstructured":"Yu W, Lu Y C, Easterbrook S, et al. Efficient and information-preserving future frame prediction and beyond. In: Proceedings of the 8th International Conference on Learning Representations, Addis Ababa, 2020"},{"key":"3859_CR17","unstructured":"Chang Z, Zhang X F, Wang S S, et al. MAU: a motion-aware unit for video prediction and beyond. In: Proceedings of the Advances in Neural Information Processing Systems, 2021. 26950\u201326962"},{"key":"3859_CR18","unstructured":"Su J H, Byeon W, Kossaifi J, et al. Convolutional tensor-train LSTM for spatio-temporal learning. In: Proceedings of the Advances in Neural Information Processing Systems, 2020"},{"key":"3859_CR19","unstructured":"Wang Y B, Long M S, Wang J M, et al. PredRNN: recurrent neural networks for predictive learning using spatiotemporal LSTMs. In: Proceedings of the Advances in Neural Information Processing Systems, Long Beach, 2017. 879\u2013888"},{"key":"3859_CR20","unstructured":"Wang Y B, Gao Z F, Long M S, et al. PredRNN+ +: towards a resolution of the deep-in-time dilemma in spatiotemporal predictive learning. In: Proceedings of the 35th International Conference on Machine Learning, Stockholm, 2018. 5110\u20135119"},{"key":"3859_CR21","unstructured":"Srivastava N, Mansimov E, Salakhutdinov R. Unsupervised learning of video representations using lstms. In: Proceedings of the 32nd International Conference on Machine Learning, Lille, 2015. 843\u2013852"},{"key":"3859_CR22","doi-asserted-by":"publisher","first-page":"102315","DOI":"10.1007\/s11432-011-4391-8","volume":"56","author":"M Deng","year":"2013","unstructured":"Deng M, Liu Q L, Wang J Q, et al. A general method of spatio-temporal clustering analysis. Sci China Inf Sci, 2013, 56: 102315","journal-title":"Sci China Inf Sci"},{"key":"3859_CR23","doi-asserted-by":"publisher","first-page":"140301","DOI":"10.1007\/s11432-019-2785-y","volume":"63","author":"J Li","year":"2020","unstructured":"Li J, Li Y F, He L, et al. Spatio-temporal fusion for remote sensing data: an overview and new benchmark. Sci China Inf Sci, 2020, 63: 140301","journal-title":"Sci China Inf Sci"},{"key":"3859_CR24","doi-asserted-by":"publisher","first-page":"2499","DOI":"10.1007\/s11432-011-4507-1","volume":"54","author":"C M Wang","year":"2011","unstructured":"Wang C M, Hu X P, Yao L, et al. Spatio-temporal pattern analysis of single-trial EEG signals recorded during visual object recognition. Sci China Inf Sci, 2011, 54: 2499\u20132507","journal-title":"Sci China Inf Sci"},{"key":"3859_CR25","doi-asserted-by":"publisher","first-page":"140302","DOI":"10.1007\/s11432-019-2805-y","volume":"63","author":"Y F Li","year":"2020","unstructured":"Li Y F, Li J, He L, et al. A new sensor bias-driven spatio-temporal fusion model based on convolutional neural networks. Sci China Inf Sci, 2020, 63: 140302","journal-title":"Sci China Inf Sci"},{"key":"3859_CR26","doi-asserted-by":"publisher","first-page":"160301","DOI":"10.1007\/s11432-020-2871-2","volume":"63","author":"Y F Ji","year":"2020","unstructured":"Ji Y F, Gu R T, Yang Z Y, et al. Artificial intelligence-driven autonomous optical networks: 3S architecture and key technologies. Sci China Inf Sci, 2020, 63: 160301","journal-title":"Sci China Inf Sci"},{"key":"3859_CR27","doi-asserted-by":"publisher","first-page":"110100","DOI":"10.1007\/s11432-017-9251-5","volume":"60","author":"J Tang","year":"2017","unstructured":"Tang J, Tong H H, Vazirgiannis M. Special focus on natural language processing and social computing. Sci China Inf Sci, 2017, 60: 110100","journal-title":"Sci China Inf Sci"},{"key":"3859_CR28","doi-asserted-by":"publisher","first-page":"229103","DOI":"10.1007\/s11432-018-9479-3","volume":"62","author":"X Y Liu","year":"2019","unstructured":"Liu X Y, Pan S D, Zhang Q, et al. Reformulating natural language queries using sequence-to-sequence models. Sci China Inf Sci, 2019, 62: 229103","journal-title":"Sci China Inf Sci"},{"key":"3859_CR29","doi-asserted-by":"publisher","first-page":"120101","DOI":"10.1007\/s11432-019-2710-7","volume":"63","author":"Y Z Gao","year":"2020","unstructured":"Gao Y Z, Chen Y Y, Wang J Q, et al. Progressive rectification network for irregular text recognition. Sci China Inf Sci, 2020, 63: 120101","journal-title":"Sci China Inf Sci"},{"key":"3859_CR30","doi-asserted-by":"publisher","first-page":"222104","DOI":"10.1007\/s11432-020-3116-x","volume":"64","author":"X B Zhou","year":"2021","unstructured":"Zhou X B, Wang Z Q, Zhou M, et al. Sentiment classification via user and product interactive modeling. Sci China Inf Sci, 2021, 64: 222104","journal-title":"Sci China Inf Sci"},{"key":"3859_CR31","doi-asserted-by":"publisher","first-page":"152102","DOI":"10.1007\/s11432-019-2740-1","volume":"64","author":"Q P Guo","year":"2021","unstructured":"Guo Q P, Qiu X P, Xue X Y, et al. Syntax-guided text generation via graph neural network. Sci China Inf Sci, 2021, 64: 152102","journal-title":"Sci China Inf Sci"},{"key":"3859_CR32","doi-asserted-by":"crossref","unstructured":"Oliu M, Selva J, Escalera S. Folded recurrent neural networks for future video prediction. In: Proceedings of the 15th European Conference on Computer Vision, Munich, 2018. 745\u2013761","DOI":"10.1007\/978-3-030-01264-9_44"},{"key":"3859_CR33","doi-asserted-by":"publisher","first-page":"7090","DOI":"10.1109\/TIP.2020.2998297","volume":"29","author":"X Y Chen","year":"2020","unstructured":"Chen X Y, Xu C, Yang X K, et al. Long-term video prediction via criticization and retrospection. IEEE Trans Image Process, 2020, 29: 7090\u20137103","journal-title":"IEEE Trans Image Process"},{"key":"3859_CR34","doi-asserted-by":"publisher","first-page":"2673","DOI":"10.1109\/78.650093","volume":"45","author":"M Schuster","year":"1997","unstructured":"Schuster M, Paliwal K K. Bidirectional recurrent neural networks. IEEE Trans Signal Process, 1997, 45: 2673\u20132681","journal-title":"IEEE Trans Signal Process"},{"key":"3859_CR35","doi-asserted-by":"publisher","first-page":"118484","DOI":"10.1016\/j.eswa.2022.118484","volume":"210","author":"K S Tan","year":"2022","unstructured":"Tan K S, Lim K M, Lee C P, et al. Bidirectional long short-term memory with temporal dense sampling for human action recognition. Expert Syst Appl, 2022, 210: 118484","journal-title":"Expert Syst Appl"},{"key":"3859_CR36","doi-asserted-by":"crossref","unstructured":"Ma Y Q, Liu W, Bai S H, et al. Few-shot visual learning with contextual memory and fine-grained calibration. In: Proceedings of the 29th International Conference on International Joint Conferences on Artificial Intelligence, 2021. 811\u2013817","DOI":"10.24963\/ijcai.2020\/113"},{"key":"3859_CR37","doi-asserted-by":"crossref","unstructured":"Zhang J B, Zheng Y, Qi D K, et al. DNN-based prediction model for spatio-temporal data. In: Proceedings of the 24th ACM SIGSPATIAL International Conference on Advances in Geographic Information Systems, 2016. 1\u20134","DOI":"10.1145\/2996913.2997016"},{"key":"3859_CR38","doi-asserted-by":"crossref","unstructured":"Zhang J B, Zheng Y, Qi D K. Deep spatio-temporal residual networks for citywide crowd flows prediction. In: Proceedings of the 31st AAAI Conference on Artificial Intelligence, San Francisco, 2017. 1655\u20131661","DOI":"10.1609\/aaai.v31i1.10735"},{"key":"3859_CR39","unstructured":"Finn C, Goodfellow I J, Levine S. Unsupervised learning for physical interaction through video prediction. In: Proceedings of the Advances in Neural Information Processing Systems, Barcelona, 2016. 64\u201372"},{"key":"3859_CR40","unstructured":"Jia X, Brabandere B D, Tuytelaars T, et al. Dynamic filter networks. In: Proceedings of the Advances in Neural Information Processing Systems, Barcelona, 2016. 667\u2013675"},{"key":"3859_CR41","unstructured":"Kalchbrenner N, van den Oord A, Simonyan K, et al. Video pixel networks. In: Proceedings of the 34th International Conference on Machine Learning, Sydney, 2017. 1771\u20131779"},{"key":"3859_CR42","unstructured":"Shi X J, Gao Z H, Lausen L, et al. Deep learning for precipitation nowcasting: a benchmark and a new model. In: Proceedings of the Advances in Neural Information Processing Systems 30, Long Beach, 2017. 5617\u20135627"},{"key":"3859_CR43","doi-asserted-by":"crossref","unstructured":"Lin Z H, Li M M, Zheng Z B, et al. Self-attention ConvLSTM for spatiotemporal prediction. In: Proceedings of the 34th AAAI Conference on Artificial Intelligence, the 32nd Innovative Applications of Artificial Intelligence Conference, the 10th AAAI Symposium on Educational Advances in Artificial Intelligence, New York, 2020. 11531\u201311538","DOI":"10.1609\/aaai.v34i07.6819"},{"key":"3859_CR44","doi-asserted-by":"crossref","unstructured":"Guo Y H, Shi H H, Kumar A, et al. SpotTune: transfer learning through adaptive fine-tuning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR), 2019","DOI":"10.1109\/CVPR.2019.00494"},{"key":"3859_CR45","unstructured":"You K C, Kou Z, Long M S, et al. Co-tuning for transfer learning. In: Proceedings of the Advances in Neural Information Processing Systems, 2020. 33"},{"key":"3859_CR46","doi-asserted-by":"publisher","first-page":"149","DOI":"10.1109\/TIP.2021.3128311","volume":"31","author":"H T Tian","year":"2022","unstructured":"Tian H T, Qu S R, Payeur P. A prototypical knowledge oriented adaptation framework for semantic segmentation. IEEE Trans Image Process, 2022, 31: 149\u2013163","journal-title":"IEEE Trans Image Process"},{"key":"3859_CR47","doi-asserted-by":"publisher","first-page":"120111","DOI":"10.1007\/s11432-019-2722-3","volume":"63","author":"Y P Gao","year":"2020","unstructured":"Gao Y P, Li X Y, Gao L. Discriminative stacked autoencoder for feature representation and classification. Sci China Inf Sci, 2020, 63: 120111","journal-title":"Sci China Inf Sci"},{"key":"3859_CR48","doi-asserted-by":"publisher","first-page":"192106","DOI":"10.1007\/s11432-020-3112-8","volume":"64","author":"J M Fang","year":"2021","unstructured":"Fang J M, Chen Y K, Zhang X B, et al. EAT-NAS: elastic architecture transfer for accelerating large-scale neural architecture search. Sci China Inf Sci, 2021, 64: 192106","journal-title":"Sci China Inf Sci"},{"key":"3859_CR49","unstructured":"Hinton G, Vinyals O, Dean J, et al. Distilling the knowledge in a neural network. 2015. ArXiv:1503.02531"},{"key":"3859_CR50","unstructured":"Romero A, Ballas N, Kahou S E, et al. FitNets: hints for thin deep nets. 2014. ArXiv:1412.6550"},{"key":"3859_CR51","doi-asserted-by":"crossref","unstructured":"Zhang L F, Song J B, Gao A N, et al. Be your own teacher: improve the performance of convolutional neural networks via self distillation. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision, 2019. 3713\u20133722","DOI":"10.1109\/ICCV.2019.00381"},{"key":"3859_CR52","doi-asserted-by":"crossref","unstructured":"Zhang Y, Xiang T, Hospedales T M, et al. Deep mutual learning. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2018. 4320\u20134328","DOI":"10.1109\/CVPR.2018.00454"},{"key":"3859_CR53","doi-asserted-by":"publisher","first-page":"229101","DOI":"10.1007\/s11432-020-3162-4","volume":"65","author":"L H Guo","year":"2022","unstructured":"Guo L H, Chen D W, Jia K. Knowledge transferred adaptive filter pruning for CNN compression and acceleration. Sci China Inf Sci, 2022, 65: 229101","journal-title":"Sci China Inf Sci"},{"key":"3859_CR54","doi-asserted-by":"publisher","first-page":"120102","DOI":"10.1007\/s11432-020-2900-x","volume":"64","author":"F L Mao","year":"2021","unstructured":"Mao F L, Ma B P, Chang H, et al. Learning efficient text-to-image synthesis via interstage cross-sample similarity distillation. Sci China Inf Sci, 2021, 64: 120102","journal-title":"Sci China Inf Sci"},{"key":"3859_CR55","unstructured":"Finn C, Abbeel P, Levine S. Model-agnostic meta-learning for fast adaptation of deep networks. In: Proceedings of the 34th International Conference on Machine Learning, Sydney, 2017. 1126\u20131135"},{"key":"3859_CR56","unstructured":"Rusu A A, Rao D, Sygnowski J, et al. Meta-learning with latent embedding optimization. In: Proceedings of the 7th International Conference on Learning Representations, New Orleans, 2019"},{"key":"3859_CR57","unstructured":"Nichol A, Achiam J, Schulman J. On first-order meta-learning algorithms. 2018. ArXiv:1803.02999"},{"key":"3859_CR58","doi-asserted-by":"publisher","first-page":"130103","DOI":"10.1007\/s11432-020-3055-1","volume":"64","author":"N Pang","year":"2021","unstructured":"Pang N, Zhao X, Wang W, et al. Few-shot text classification by leveraging bi-directional attention and cross-class knowledge. Sci China Inf Sci, 2021, 64: 130103","journal-title":"Sci China Inf Sci"},{"key":"3859_CR59","doi-asserted-by":"publisher","first-page":"120104","DOI":"10.1007\/s11432-020-3156-7","volume":"64","author":"G Cheng","year":"2021","unstructured":"Cheng G, Li R M, Lang C B, et al. Task-wise attention guided part complementary learning for few-shot image classification. Sci China Inf Sci, 2021, 64: 120104","journal-title":"Sci China Inf Sci"},{"key":"3859_CR60","doi-asserted-by":"publisher","first-page":"192105","DOI":"10.1007\/s11432-020-2973-7","volume":"64","author":"M T Chen","year":"2021","unstructured":"Chen M T, Wang X G, Luo H, et al. Learning to focus: cascaded feature matching network for few-shot image recognition. Sci China Inf Sci, 2021, 64: 192105","journal-title":"Sci China Inf Sci"},{"key":"3859_CR61","doi-asserted-by":"crossref","unstructured":"Kweon W, Kang S, Yu H. Bidirectional distillation for top-k recommender system. In: Proceedings of the Web Conference 2021, 2021. 3861\u20133871","DOI":"10.1145\/3442381.3449878"},{"key":"3859_CR62","unstructured":"Antoniou A, Edwards H, Storkey A. How to train your MAML. 2018. ArXiv:1810.09502"},{"key":"3859_CR63","unstructured":"Li Z G, Zhou F W, Chen F, et al. Meta-SGD: learning to learn quickly for few shot learning. 2017. ArXiv:1707.09835"},{"key":"3859_CR64","doi-asserted-by":"crossref","unstructured":"Sun Q R, Liu Y Y, Chua T S, et al. Meta-transfer learning for few-shot learning. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, 2019. 403\u2013412","DOI":"10.1109\/CVPR.2019.00049"},{"key":"3859_CR65","doi-asserted-by":"crossref","unstructured":"Sch\u00fcldt C, Laptev I, Caputo B. Recognizing human actions: a local SVM approach. In: Proceedings of the 17th International Conference on Pattern Recognition, Cambridge, 2004. 32\u201336","DOI":"10.1109\/ICPR.2004.1334462"},{"key":"3859_CR66","doi-asserted-by":"publisher","first-page":"1325","DOI":"10.1109\/TPAMI.2013.248","volume":"36","author":"C Ionescu","year":"2014","unstructured":"Ionescu C, Papava D, Olaru V, et al. Human3.6M: large scale datasets and predictive methods for 3D human sensing in natural environments. IEEE Trans Pattern Anal Mach Intell, 2014, 36: 1325\u20131339","journal-title":"IEEE Trans Pattern Anal Mach Intell"},{"key":"3859_CR67","unstructured":"Kingma D P, Ba J. Adam: a method for stochastic optimization. In: Proceedings of the 3rd International Conference on Learning Representations, San Diego, 2015"},{"key":"3859_CR68","doi-asserted-by":"publisher","first-page":"600","DOI":"10.1109\/TIP.2003.819861","volume":"13","author":"Z Wang","year":"2004","unstructured":"Wang Z, Bovik A C, Sheikh H R, et al. Image quality assessment: from error visibility to structural similarity. IEEE Trans Image Process, 2004, 13: 600\u2013612","journal-title":"IEEE Trans Image Process"},{"key":"3859_CR69","doi-asserted-by":"crossref","unstructured":"Zhang R, Isola P, Efros A A, et al. The unreasonable effectiveness of deep features as a perceptual metric. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, Salt Lake City, 2018. 586\u2013595","DOI":"10.1109\/CVPR.2018.00068"},{"key":"3859_CR70","unstructured":"Krizhevsky A, Sutskever I, Hinton G E. ImageNet classification with deep convolutional neural networks. In: Proceedings of the Advances in Neural Information Processing Systems, 2012. 1106\u20131114"},{"key":"3859_CR71","doi-asserted-by":"crossref","unstructured":"Wu H X, Yao Z Y, Wang J M, et al. MotionRNN: a flexible model for video prediction with spacetime-varying motions. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, 2021. 15435\u201315444","DOI":"10.1109\/CVPR46437.2021.01518"},{"key":"3859_CR72","doi-asserted-by":"crossref","unstructured":"Chang Z, Zhang X F, Wang S S, et al. STRPM: a spatiotemporal residual predictive model for high-resolution video prediction. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, New Orleans, 2022. 13926\u201313935","DOI":"10.1109\/CVPR52688.2022.01356"},{"key":"3859_CR73","unstructured":"Villegas R, Yang J M, Hong S, et al. Decomposing motion and content for natural video sequence prediction. In: Proceedings of the 5th International Conference on Learning Representations, Toulon, 2017"}],"container-title":["Science China Information Sciences"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11432-022-3859-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s11432-022-3859-8\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s11432-022-3859-8.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,19]],"date-time":"2025-09-19T19:40:33Z","timestamp":1758310833000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s11432-022-3859-8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,7,22]]},"references-count":73,"journal-issue":{"issue":"8","published-print":{"date-parts":[[2024,8]]}},"alternative-id":["3859"],"URL":"https:\/\/doi.org\/10.1007\/s11432-022-3859-8","relation":{},"ISSN":["1674-733X","1869-1919"],"issn-type":[{"value":"1674-733X","type":"print"},{"value":"1869-1919","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024,7,22]]},"assertion":[{"value":"19 July 2022","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"31 March 2023","order":2,"name":"revised","label":"Revised","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"4 September 2023","order":3,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"22 July 2024","order":4,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}}],"article-number":"182104"}}