{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,1]],"date-time":"2026-05-01T16:58:05Z","timestamp":1777654685240,"version":"3.51.4"},"publisher-location":"Cham","reference-count":34,"publisher":"Springer Nature Switzerland","isbn-type":[{"value":"9783031439032","type":"print"},{"value":"9783031439049","type":"electronic"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-43904-9_55","type":"book-chapter","created":{"date-parts":[[2023,9,30]],"date-time":"2023-09-30T23:08:57Z","timestamp":1696115337000},"page":"569-578","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":23,"title":["Self-supervised Learning for\u00a0Endoscopic Video Analysis"],"prefix":"10.1007","author":[{"given":"Roy","family":"Hirsch","sequence":"first","affiliation":[]},{"given":"Mathilde","family":"Caron","sequence":"additional","affiliation":[]},{"given":"Regev","family":"Cohen","sequence":"additional","affiliation":[]},{"given":"Amir","family":"Livne","sequence":"additional","affiliation":[]},{"given":"Ron","family":"Shapiro","sequence":"additional","affiliation":[]},{"given":"Tomer","family":"Golany","sequence":"additional","affiliation":[]},{"given":"Roman","family":"Goldenberg","sequence":"additional","affiliation":[]},{"given":"Daniel","family":"Freedman","sequence":"additional","affiliation":[]},{"given":"Ehud","family":"Rivlin","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,10,1]]},"reference":[{"issue":"2","key":"55_CR1","first-page":"114","volume":"36","author":"G Antonelli","year":"2023","unstructured":"Antonelli, G., Rizkala, T., Iacopini, F., Hassan, C.: Current and future implications of artificial intelligence in colonoscopy. Ann. Gastroenterol. 36(2), 114\u2013122 (2023)","journal-title":"Ann. Gastroenterol."},{"key":"55_CR2","doi-asserted-by":"publisher","unstructured":"Assran, M., et al.: Masked siamese networks for label-efficient learning. In: ECCV (2022). https:\/\/doi.org\/10.1007\/978-3-031-19821-2_26","DOI":"10.1007\/978-3-031-19821-2_26"},{"issue":"6","key":"55_CR3","doi-asserted-by":"publisher","first-page":"1460","DOI":"10.1053\/j.gastro.2017.10.026","volume":"153","author":"MF Byrne","year":"2017","unstructured":"Byrne, M.F., Shahidi, N., Rex, D.K.: Will computer-aided detection and diagnosis revolutionize colonoscopy? Gastroenterology 153(6), 1460\u20131464 (2017)","journal-title":"Gastroenterology"},{"key":"55_CR4","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1007\/978-3-030-01264-9_9","volume-title":"Computer Vision \u2013 ECCV 2018","author":"M Caron","year":"2018","unstructured":"Caron, M., Bojanowski, P., Joulin, A., Douze, M.: Deep clustering for unsupervised learning of visual features. In: Ferrari, V., Hebert, M., Sminchisescu, C., Weiss, Y. (eds.) Computer Vision \u2013 ECCV 2018. LNCS, vol. 11218, pp. 139\u2013156. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-01264-9_9"},{"key":"55_CR5","unstructured":"Caron, M., Misra, I., Mairal, J., Goyal, P., Bojanowski, P., Joulin, A.: Unsupervised learning of visual features by contrasting cluster assignments. In: NeurIPS (2020)"},{"key":"55_CR6","doi-asserted-by":"crossref","unstructured":"Caron, M., et al.: Emerging properties in self-supervised vision transformers. In: ICCV (2021)","DOI":"10.1109\/ICCV48922.2021.00951"},{"key":"55_CR7","unstructured":"Chen, T., Kornblith, S., Norouzi, M., Hinton, G.: A simple framework for contrastive learning of visual representations. In: ICML (2020)"},{"key":"55_CR8","doi-asserted-by":"crossref","unstructured":"Chen, X., He, K.: Exploring simple siamese representation learning. In: CVPR (2021)","DOI":"10.1109\/CVPR46437.2021.01549"},{"key":"55_CR9","doi-asserted-by":"crossref","unstructured":"Chen, X., Xie, S., He, K.: An empirical study of training self-supervised vision transformers. In: ICCV (2021)","DOI":"10.1109\/ICCV48922.2021.00950"},{"key":"55_CR10","first-page":"18152","volume":"34","author":"R Cohen","year":"2021","unstructured":"Cohen, R., Blau, Y., Freedman, D., Rivlin, E.: It has potential: gradient-driven denoisers for convergent solutions to inverse problems. Adv. Neural. Inf. Process. Syst. 34, 18152\u201318164 (2021)","journal-title":"Adv. Neural. Inf. Process. Syst."},{"issue":"3","key":"55_CR11","doi-asserted-by":"publisher","first-page":"1374","DOI":"10.1137\/20M1337168","volume":"14","author":"R Cohen","year":"2021","unstructured":"Cohen, R., Elad, M., Milanfar, P.: Regularization by denoising via fixed-point projection (RED-PRO). SIAM J. Imag. Sci. 14(3), 1374\u20131406 (2021)","journal-title":"SIAM J. Imag. Sci."},{"key":"55_CR12","doi-asserted-by":"crossref","unstructured":"da Costa Rocha, C., Padoy, N., Rosa, B.: Self-supervised surgical tool segmentation using kinematic information. In: 2019 International Conference on Robotics and Automation (ICRA), pp. 8720\u20138726. IEEE (2019)","DOI":"10.1109\/ICRA.2019.8794334"},{"key":"55_CR13","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"343","DOI":"10.1007\/978-3-030-59716-0_33","volume-title":"Medical Image Computing and Computer Assisted Intervention \u2013 MICCAI 2020","author":"T Czempiel","year":"2020","unstructured":"Czempiel, T., et al.: TeCNO: surgical phase recognition with multi-stage temporal convolutional networks. In: Martel, A.L., et al. (eds.) MICCAI 2020. LNCS, vol. 12263, pp. 343\u2013352. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-59716-0_33"},{"key":"55_CR14","doi-asserted-by":"crossref","unstructured":"Dayyeh, B.K.A., et al.: Asge technology committee systematic review and meta-analysis assessing the asge pivi thresholds for adopting real-time endoscopic assessment of the histology of diminutive colorectal polyps. Gastrointest. Endosc. 81(3), 502.e1\u2013502.e16 (2015)","DOI":"10.1016\/j.gie.2014.12.022"},{"key":"55_CR15","doi-asserted-by":"crossref","unstructured":"Dehghani, M., Gritsenko, A., Arnab, A., Minderer, M., Tay, Y.: Scenic: a jax library for computer vision research and beyond. In: CVPR, pp. 21393\u201321398 (2022)","DOI":"10.1109\/CVPR52688.2022.02070"},{"key":"55_CR16","unstructured":"Dosovitskiy, A., et al.: An image is worth 16x16 words: transformers for image recognition at scale. arXiv preprint arXiv:2010.11929 (2020)"},{"key":"55_CR17","unstructured":"Golany, T., et al.: AI for phase recognition in complex laparoscopic cholecystectomy. Surgical Endoscopy, 1\u20139 (2022)"},{"key":"55_CR18","doi-asserted-by":"publisher","unstructured":"Goldbraikh, A., Avisdris, N., Pugh, C.M., Laufer, S.: Bounded future MS-TCN++ for surgical gesture recognition. In: ECCV 2022 Workshops, October 23\u201327, 2022, Proceedings, Part III, pp. 406\u2013421. Springer (2023). https:\/\/doi.org\/10.1007\/978-3-031-25066-8_22","DOI":"10.1007\/978-3-031-25066-8_22"},{"issue":"1","key":"55_CR19","doi-asserted-by":"publisher","first-page":"77","DOI":"10.1016\/j.gie.2020.06.059","volume":"93","author":"C Hassan","year":"2021","unstructured":"Hassan, C., et al.: Performance of artificial intelligence in colonoscopy for adenoma and polyp detection: a systematic review and meta-analysis. Gastrointest. Endosc. 93(1), 77\u201385 (2021)","journal-title":"Gastrointest. Endosc."},{"key":"55_CR20","doi-asserted-by":"crossref","unstructured":"He, K., Chen, X., Xie, S., Li, Y., Doll\u00e1r, P., Girshick, R.: Masked autoencoders are scalable vision learners. In: CVPR (2022)","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"55_CR21","doi-asserted-by":"crossref","unstructured":"Intrator, Y., Aizenberg, N., Livne, A., Rivlin, E., Goldenberg, R.: Self-supervised polyp re-identification in colonoscopy. arXiv preprint arXiv:2306.08591 (2023)","DOI":"10.1007\/978-3-031-43904-9_57"},{"key":"55_CR22","unstructured":"Joulin, A., Bach, F.: A convex relaxation for weakly supervised classifiers. arXiv preprint arXiv:1206.6413 (2012)"},{"key":"55_CR23","doi-asserted-by":"publisher","unstructured":"Katzir, L., et al.: Estimating withdrawal time in colonoscopies. In: ECCV, pp. 495\u2013512. Springer (2022). https:\/\/doi.org\/10.1007\/978-3-031-25066-8_28","DOI":"10.1007\/978-3-031-25066-8_28"},{"key":"55_CR24","doi-asserted-by":"crossref","unstructured":"Kutiel, G., Cohen, R., Elad, M., Freedman, D., Rivlin, E.: Conformal prediction masks: visualizing uncertainty in medical imaging. In: ICLR 2023 Workshop on Trustworthy Machine Learning for Healthcare (2023)","DOI":"10.1007\/978-3-031-39539-0_14"},{"issue":"6","key":"55_CR25","doi-asserted-by":"publisher","first-page":"1099","DOI":"10.1016\/j.gie.2021.06.021","volume":"94","author":"DM Livovsky","year":"2021","unstructured":"Livovsky, D.M., et al.: Detection of elusive polyps using a large-scale artificial intelligence system (with videos). Gastrointest. Endosc. 94(6), 1099\u20131109 (2021)","journal-title":"Gastrointest. Endosc."},{"key":"55_CR26","doi-asserted-by":"crossref","unstructured":"Ou, S., Gao, Y., Zhang, Z., Shi, C.: Polyp-YOLOv5-Tiny: a lightweight model for real-time polyp detection. In: International Conference on Information Technology, Big Data and Artificial Intelligence (ICIBA), vol. 2, pp. 1106\u20131111 (2021","DOI":"10.1109\/ICIBA52610.2021.9688145"},{"key":"55_CR27","doi-asserted-by":"publisher","DOI":"10.1016\/j.media.2023.102844","volume":"88","author":"S Ramesh","year":"2023","unstructured":"Ramesh, S., et al.: Dissecting self-supervised learning methods for surgical computer vision. Med. Image Anal. 88, 102844 (2023)","journal-title":"Med. Image Anal."},{"key":"55_CR28","doi-asserted-by":"publisher","first-page":"925","DOI":"10.1007\/s11548-018-1772-0","volume":"13","author":"T Ross","year":"2018","unstructured":"Ross, T., et al.: Exploiting the potential of unlabeled endoscopic video data with self-supervised learning. Int. J. Comput. Assist. Radiol. Surg. 13, 925\u2013933 (2018)","journal-title":"Int. J. Comput. Assist. Radiol. Surg."},{"key":"55_CR29","doi-asserted-by":"crossref","unstructured":"Russakovsky, O., et al.: Imagenet large scale visual recognition challenge. In: IJCV (2015)","DOI":"10.1007\/s11263-015-0816-y"},{"issue":"2","key":"55_CR30","doi-asserted-by":"publisher","first-page":"2938","DOI":"10.1109\/LRA.2021.3062308","volume":"6","author":"L Sestini","year":"2021","unstructured":"Sestini, L., Rosa, B., De Momi, E., Ferrigno, G., Padoy, N.: A kinematic bottleneck approach for pose regression of flexible surgical instruments directly from images. IEEE Robotics Autom. Lett. 6(2), 2938\u20132945 (2021)","journal-title":"IEEE Robotics Autom. Lett."},{"key":"55_CR31","doi-asserted-by":"crossref","unstructured":"Touvron, H., Cord, M., J\u00e9gou, H.: DeIT III: Revenge of the ViT. arXiv preprint arXiv:2204.07118 (2022)","DOI":"10.1007\/978-3-031-20053-3_30"},{"issue":"1","key":"55_CR32","doi-asserted-by":"publisher","first-page":"86","DOI":"10.1109\/TMI.2016.2593957","volume":"36","author":"AP Twinanda","year":"2016","unstructured":"Twinanda, A.P., Shehata, S., Mutter, D., Marescaux, J., De Mathelin, M., Padoy, N.: Endonet: a deep architecture for recognition tasks on laparoscopic videos. IEEE Trans. Med. Imaging 36(1), 86\u201397 (2016)","journal-title":"IEEE Trans. Med. Imaging"},{"key":"55_CR33","doi-asserted-by":"publisher","DOI":"10.7910\/DVN\/FCBUOR","author":"G Wang","year":"2021","unstructured":"Wang, G.: Replication data for: colonoscopy polyp detection and classification: dataset creation and comparative evaluations. Harvard Dataverse (2021). https:\/\/doi.org\/10.7910\/DVN\/FCBUOR","journal-title":"Harvard Dataverse"},{"key":"55_CR34","unstructured":"Zhou, J., et al.: ibot: image bert pre-training with online tokenizer. arXiv preprint arXiv:2111.07832 (2021)"}],"container-title":["Lecture Notes in Computer Science","Medical Image Computing and Computer Assisted Intervention \u2013 MICCAI 2023"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-43904-9_55","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,11]],"date-time":"2024-03-11T14:41:29Z","timestamp":1710168089000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-43904-9_55"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031439032","9783031439049"],"references-count":34,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-43904-9_55","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"1 October 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"MICCAI","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Medical Image Computing and Computer-Assisted Intervention","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Vancouver, BC","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Canada","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2023","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"8 October 2023","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"12 October 2023","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"miccai2023","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/conferences.miccai.org\/2023\/en\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"CMT","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"2250","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"730","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"32% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"5","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}