{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,6]],"date-time":"2026-03-06T04:12:35Z","timestamp":1772770355891,"version":"3.50.1"},"publisher-location":"Cham","reference-count":40,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031721199","type":"print"},{"value":"9783031721205","type":"electronic"}],"license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2024]]},"DOI":"10.1007\/978-3-031-72120-5_61","type":"book-chapter","created":{"date-parts":[[2024,10,2]],"date-time":"2024-10-02T12:02:53Z","timestamp":1727870573000},"page":"656-666","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":3,"title":["Spatiotemporal Representation Learning for\u00a0Short and\u00a0Long Medical Image Time Series"],"prefix":"10.1007","author":[{"given":"Chengzhi","family":"Shen","sequence":"first","affiliation":[]},{"given":"Martin J.","family":"Menten","sequence":"additional","affiliation":[]},{"given":"Hrvoje","family":"Bogunovi\u0107","sequence":"additional","affiliation":[]},{"given":"Ursula","family":"Schmidt-Erfurth","sequence":"additional","affiliation":[]},{"given":"Hendrik P. N.","family":"Scholl","sequence":"additional","affiliation":[]},{"given":"Sobha","family":"Sivaprasad","sequence":"additional","affiliation":[]},{"given":"Andrew","family":"Lotery","sequence":"additional","affiliation":[]},{"given":"Daniel","family":"Rueckert","sequence":"additional","affiliation":[]},{"given":"Paul","family":"Hager","sequence":"additional","affiliation":[]},{"given":"Robbie","family":"Holland","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,10,3]]},"reference":[{"key":"61_CR1","doi-asserted-by":"crossref","unstructured":"Assran, M., et\u00a0al.: Self-supervised learning from images with a joint-embedding predictive architecture. In: CVPR. pp. 15619\u201315629 (2023)","DOI":"10.1109\/CVPR52729.2023.01499"},{"key":"61_CR2","unstructured":"Bardes, A., et\u00a0al.: V-jepa: Latent video prediction for visual representation learning (2023)"},{"issue":"11","key":"61_CR3","first-page":"2514","volume":"37","author":"O Bernard","year":"2018","unstructured":"Bernard, O., et\u00a0al.: Deep learning techniques for automatic mri cardiac multi-structures segmentation and diagnosis: is the problem solved? IEEE TMI 37(11), 2514\u20132525 (2018)","journal-title":"IEEE TMI"},{"key":"61_CR4","doi-asserted-by":"crossref","unstructured":"Caron, M., et\u00a0al.: Emerging properties in self-supervised vision transformers. In: CVPR. pp. 9650\u20139660 (2021)","DOI":"10.1109\/ICCV48922.2021.00951"},{"issue":"7","key":"61_CR5","doi-asserted-by":"publisher","first-page":"901","DOI":"10.14219\/jada.archive.2001.0302","volume":"132","author":"N Chainani-Wu","year":"2001","unstructured":"Chainani-Wu, N., et\u00a0al.: Oral lichen planus: patient profile, disease progression and treatment responses. The Journal of the American Dental Association 132(7), 901\u2013909 (2001)","journal-title":"The Journal of the American Dental Association"},{"key":"61_CR6","unstructured":"Chen, T., Kornblith, S., Norouzi, M., Hinton, G.E.: A simple framework for contrastive learning of visual representations. CoRR abs\/2002.05709 (2020), https:\/\/arxiv.org\/abs\/2002.05709"},{"key":"61_CR7","unstructured":"Chen, T., et\u00a0al.: A simple framework for contrastive learning of visual representations. In: ICML. pp. 1597\u20131607. PMLR (2020)"},{"key":"61_CR8","doi-asserted-by":"crossref","unstructured":"Chen, X., et\u00a0al.: Exploring simple siamese representation learning. In: CVPR. pp. 15750\u201315758 (2021)","DOI":"10.1109\/CVPR46437.2021.01549"},{"key":"61_CR9","doi-asserted-by":"crossref","unstructured":"Couronn\u00e9, R., et\u00a0al.: Longitudinal self-supervision to disentangle inter-patient variability from disease progression. In: MICCAI. pp. 231\u2013241. Springer (2021)","DOI":"10.1007\/978-3-030-87196-3_22"},{"key":"61_CR10","volume":"219","author":"I Dave","year":"2022","unstructured":"Dave, I., et\u00a0al.: Tclr: Temporal contrastive learning for video representation. CVIU 219, 103406 (2022)","journal-title":"CVIU"},{"key":"61_CR11","unstructured":"Dosovitskiy, A., et\u00a0al.: An image is worth 16x16 words: Transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)"},{"key":"61_CR12","doi-asserted-by":"crossref","unstructured":"Feichtenhofer, C., Fan, H., Malik, J., He, K.: Slowfast networks for video recognition. In: ICCV. pp. 6202\u20136211 (2019)","DOI":"10.1109\/ICCV.2019.00630"},{"key":"61_CR13","doi-asserted-by":"crossref","unstructured":"Feichtenhofer, C., et\u00a0al.: A large-scale study on unsupervised spatiotemporal representation learning. In: CVPR. pp. 3299\u20133309 (2021)","DOI":"10.1109\/CVPR46437.2021.00331"},{"issue":"1","key":"61_CR14","doi-asserted-by":"publisher","first-page":"58","DOI":"10.7150\/jca.7047","volume":"5","author":"LJ Graham","year":"2014","unstructured":"Graham, L.J., et\u00a0al.: Current approaches and challenges in monitoring treatment responses in breast cancer. Journal of Cancer 5(1), \u00a058 (2014)","journal-title":"Journal of Cancer"},{"key":"61_CR15","first-page":"21271","volume":"33","author":"JB Grill","year":"2020","unstructured":"Grill, J.B., et\u00a0al.: Bootstrap your own latent-a new approach to self-supervised learning. NeurIPS 33, 21271\u201321284 (2020)","journal-title":"NeurIPS"},{"key":"61_CR16","doi-asserted-by":"crossref","unstructured":"He, K., et\u00a0al.: Momentum contrast for unsupervised visual representation learning. In: CVPR. pp. 9729\u20139738 (2020)","DOI":"10.1109\/CVPR42600.2020.00975"},{"key":"61_CR17","first-page":"6840","volume":"33","author":"J Ho","year":"2020","unstructured":"Ho, J., Jain, A., Abbeel, P.: Denoising diffusion probabilistic models. Advances in neural information processing systems 33, 6840\u20136851 (2020)","journal-title":"Advances in neural information processing systems"},{"key":"61_CR18","doi-asserted-by":"crossref","unstructured":"Holland, R., et\u00a0al.: Clustering disease trajectories in contrastive feature space for biomarker proposal in age-related macular degeneration. In: MICCAI. pp. 724\u2013734. Springer (2023)","DOI":"10.1007\/978-3-031-43990-2_68"},{"key":"61_CR19","doi-asserted-by":"crossref","unstructured":"Jensen, A.B., et\u00a0al.: Temporal disease trajectories condensed from population-wide registry data covering 6.2 million patients. Nature communications 5(1), \u00a04022 (2014)","DOI":"10.1038\/ncomms5022"},{"key":"61_CR20","unstructured":"Kay, W., et\u00a0al.: The kinetics human action video dataset. arXiv preprint arXiv:1705.06950 (2017)"},{"issue":"1","key":"61_CR21","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1002\/pon.3022","volume":"22","author":"L Koch","year":"2013","unstructured":"Koch, L., et\u00a0al.: Fear of recurrence and disease progression in long-term ($$\\ge $$ 5 years) cancer survivors-a systematic review of quantitative studies. Psycho-oncology 22(1), 1\u201311 (2013)","journal-title":"Psycho-oncology"},{"issue":"1","key":"61_CR22","doi-asserted-by":"publisher","first-page":"371","DOI":"10.3390\/app11010371","volume":"11","author":"M Komatsu","year":"2021","unstructured":"Komatsu, M., et\u00a0al.: Detection of cardiac structural abnormalities in fetal ultrasound videos using deep learning. Applied Sciences 11(1), \u00a0371 (2021)","journal-title":"Applied Sciences"},{"key":"61_CR23","doi-asserted-by":"publisher","first-page":"41","DOI":"10.1016\/j.bspc.2018.08.007","volume":"47","author":"V Mond\u00e9jar-Guerra","year":"2019","unstructured":"Mond\u00e9jar-Guerra, V., et\u00a0al.: Heartbeat classification fusing temporal and morphological information of ecgs via ensemble of classifiers. Biomedical Signal Processing and Control 47, 41\u201348 (2019)","journal-title":"Biomedical Signal Processing and Control"},{"key":"61_CR24","doi-asserted-by":"crossref","unstructured":"Ouyang, J., et\u00a0al.: Self-supervised longitudinal neighbourhood embedding. In: MICCAI. pp. 80\u201389. Springer (2021)","DOI":"10.1007\/978-3-030-87196-3_8"},{"key":"61_CR25","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2022.102571","volume":"82","author":"J Ouyang","year":"2022","unstructured":"Ouyang, J., et\u00a0al.: Self-supervised learning of neighborhood embedding for longitudinal mri. Medical image analysis 82, 102571 (2022)","journal-title":"Medical image analysis"},{"key":"61_CR26","unstructured":"Park, J., et\u00a0al.: Probabilistic representations for video contrastive learning. In: CVPR. pp. 14711\u201314721 (2022)"},{"issue":"2","key":"61_CR27","doi-asserted-by":"publisher","first-page":"214","DOI":"10.1016\/j.ejrad.2008.06.031","volume":"68","author":"D Pugash","year":"2008","unstructured":"Pugash, D., et\u00a0al.: Prenatal ultrasound and fetal mri: the comparative value of each modality in prenatal diagnosis. European journal of radiology 68(2), 214\u2013226 (2008)","journal-title":"European journal of radiology"},{"key":"61_CR28","doi-asserted-by":"crossref","unstructured":"Qian, R., et\u00a0al.: Spatiotemporal contrastive video representation learning. In: CVPR. pp. 6964\u20136974 (2021)","DOI":"10.1109\/CVPR46437.2021.00689"},{"key":"61_CR29","first-page":"13541","volume":"35","author":"M Ren","year":"2022","unstructured":"Ren, M., et\u00a0al.: Local spatiotemporal representation learning for longitudinally-consistent neuroimage analysis. NeurIPS 35, 13541\u201313556 (2022)","journal-title":"NeurIPS"},{"issue":"4","key":"61_CR30","doi-asserted-by":"publisher","first-page":"537","DOI":"10.1016\/j.ophtha.2017.09.028","volume":"125","author":"SR Sadda","year":"2018","unstructured":"Sadda, S.R., et\u00a0al.: Consensus definition for atrophy associated with age-related macular degeneration on oct: classification of atrophy report 3. Ophthalmology 125(4), 537\u2013548 (2018)","journal-title":"Ophthalmology"},{"issue":"8","key":"61_CR31","doi-asserted-by":"publisher","first-page":"1930","DOI":"10.1109\/TPAMI.2012.277","volume":"35","author":"HC Shin","year":"2012","unstructured":"Shin, H.C., et\u00a0al.: Stacked autoencoders for unsupervised feature learning and multiple organ detection in a pilot study using 4d patient data. IEEE TPAMI 35(8), 1930\u20131943 (2012)","journal-title":"IEEE TPAMI"},{"issue":"3","key":"61_CR32","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pmed.1001779","volume":"12","author":"C Sudlow","year":"2015","unstructured":"Sudlow, C., et\u00a0al.: Uk biobank: an open access resource for identifying the causes of a wide range of complex diseases of middle and old age. PLoS medicine 12(3), e1001779 (2015)","journal-title":"PLoS medicine"},{"key":"61_CR33","unstructured":"Sutton, J., et\u00a0al.: Developing and validating a multivariable prediction model which predicts progression of intermediate to late age-related macular degeneration-the pinnacle trial protocol. Eye pp.\u00a01\u20139 (2022)"},{"key":"61_CR34","first-page":"10078","volume":"35","author":"Z Tong","year":"2022","unstructured":"Tong, Z., et\u00a0al.: Videomae: Masked autoencoders are data-efficient learners for self-supervised video pre-training. NeurIPS 35, 10078\u201310093 (2022)","journal-title":"NeurIPS"},{"key":"61_CR35","doi-asserted-by":"crossref","unstructured":"Wang, J., et\u00a0al.: Long-short temporal contrastive learning of video transformers. In: CVPR. pp. 14010\u201314020 (2022)","DOI":"10.1109\/CVPR52688.2022.01362"},{"key":"61_CR36","doi-asserted-by":"crossref","unstructured":"Wei, J., et\u00a0al.: Consistent segmentation of longitudinal brain mr images with spatio-temporal constrained networks. In: MICCAI. pp. 89\u201398. Springer (2021)","DOI":"10.1007\/978-3-030-87193-2_9"},{"key":"61_CR37","doi-asserted-by":"crossref","unstructured":"Yang, D., et\u00a0al.: Self-supervised video representation learning via latent time navigation. arXiv preprint arXiv:2305.06437 (2023)","DOI":"10.1609\/aaai.v37i3.25416"},{"key":"61_CR38","doi-asserted-by":"crossref","unstructured":"Zhang, H., et\u00a0al.: Modeling video as stochastic processes for fine-grained video representation learning. In: CVPR. pp. 2225\u20132234 (2023)","DOI":"10.1109\/CVPR52729.2023.00221"},{"key":"61_CR39","doi-asserted-by":"crossref","unstructured":"Zhao, Q., et\u00a0al.: Longitudinal correlation analysis for decoding multi-modal brain development. In: MICCAI. pp. 400\u2013409. Springer (2021)","DOI":"10.1007\/978-3-030-87234-2_38"},{"key":"61_CR40","doi-asserted-by":"crossref","unstructured":"Zhuang, C., et\u00a0al.: Unsupervised learning from video with deep neural embeddings. In: CVPR. pp. 9563\u20139572 (2020)","DOI":"10.1109\/CVPR42600.2020.00958"}],"container-title":["Lecture Notes in Computer Science","Medical Image Computing and Computer Assisted Intervention \u2013 MICCAI 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-72120-5_61","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,10,2]],"date-time":"2024-10-02T12:29:29Z","timestamp":1727872169000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-72120-5_61"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"ISBN":["9783031721199","9783031721205"],"references-count":40,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-72120-5_61","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024]]},"assertion":[{"value":"3 October 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"The authors have no competing interests to declare that are relevant to the content of this article.","order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Disclosure of Interests"}},{"value":"MICCAI","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Medical Image Computing and Computer-Assisted Intervention","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Marrakesh","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Morocco","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"7 October 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"11 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"miccai2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/conferences.miccai.org\/2024\/en\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}