{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,10]],"date-time":"2026-04-10T01:25:14Z","timestamp":1775784314737,"version":"3.50.1"},"publisher-location":"Cham","reference-count":29,"publisher":"Springer International Publishing","isbn-type":[{"value":"9783030872014","type":"print"},{"value":"9783030872021","type":"electronic"}],"license":[{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"},{"start":{"date-parts":[[2021,1,1]],"date-time":"2021-01-01T00:00:00Z","timestamp":1609459200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021]]},"DOI":"10.1007\/978-3-030-87202-1_49","type":"book-chapter","created":{"date-parts":[[2021,9,22]],"date-time":"2021-09-22T19:03:23Z","timestamp":1632337403000},"page":"509-518","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":21,"title":["Effective Semantic Segmentation in Cataract Surgery: What Matters Most?"],"prefix":"10.1007","author":[{"given":"Theodoros","family":"Pissas","sequence":"first","affiliation":[]},{"given":"Claudio S.","family":"Ravasio","sequence":"additional","affiliation":[]},{"given":"Lyndon","family":"Da Cruz","sequence":"additional","affiliation":[]},{"given":"Christos","family":"Bergeles","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2021,9,21]]},"reference":[{"key":"49_CR1","unstructured":"Blindness and vision impairment. https:\/\/www.who.int\/news-room\/fact-sheets\/detail\/blindness-and-visual-impairment. Accessed 1 Mar 2021"},{"key":"49_CR2","doi-asserted-by":"publisher","first-page":"24","DOI":"10.1016\/j.media.2018.11.008","volume":"52","author":"H Al Hajj","year":"2019","unstructured":"Al Hajj, H., et al.: Cataracts: challenge on automatic tool annotation for cataract surgery. Med. Image Anal. 52, 24\u201341 (2019)","journal-title":"Med. Image Anal."},{"key":"49_CR3","series-title":"Communications in Computer and Information Science","doi-asserted-by":"publisher","first-page":"277","DOI":"10.1007\/978-3-319-95921-4_26","volume-title":"Medical Image Understanding and Analysis","author":"L Berger","year":"2018","unstructured":"Berger, L., Eoin, H., Cardoso, M.J., Ourselin, S.: An adaptive sampling scheme to efficiently train fully convolutional networks for semantic segmentation. In: Nixon, M., Mahmoodi, S., Zwiggelaar, R. (eds.) MIUA 2018. CCIS, vol. 894, pp. 277\u2013286. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-319-95921-4_26"},{"key":"49_CR4","doi-asserted-by":"crossref","unstructured":"Berman, M., Triki, A.R., Blaschko, M.B.: The lov\u00e1sz-softmax loss: a tractable surrogate for the optimization of the intersection-over-union measure in neural networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4413\u20134421 (2018)","DOI":"10.1109\/CVPR.2018.00464"},{"key":"49_CR5","doi-asserted-by":"crossref","unstructured":"Chen, L.C., Zhu, Y., Papandreou, G., Schroff, F., Adam, H.: Encoder-decoder with atrous separable convolution for semantic image segmentation. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 801\u2013818 (2018)","DOI":"10.1007\/978-3-030-01234-2_49"},{"key":"49_CR6","unstructured":"Chen, X., Fan, H., Girshick, R., He, K.: Improved baselines with momentum contrastive learning. arXiv preprint arXiv:2003.04297 (2020)"},{"key":"49_CR7","doi-asserted-by":"crossref","unstructured":"Fox, M., Taschwer, M., Schoeffmann, K.: Pixel-based tool segmentation in cataract surgery videos with mask R-CNN. In: 2020 IEEE 33rd International Symposium on Computer-Based Medical Systems (CBMS), pp. 565\u2013568. IEEE (2020)","DOI":"10.1109\/CBMS49503.2020.00112"},{"key":"49_CR8","doi-asserted-by":"publisher","unstructured":"Grammatikopoulou, M., et al.: Cadis: cataract dataset for surgical RGB-image segmentation. Med. Image Anal. 71,(2021). https:\/\/doi.org\/10.1016\/j.media.2021.102053","DOI":"10.1016\/j.media.2021.102053"},{"key":"49_CR9","doi-asserted-by":"crossref","unstructured":"Gupta, A., Dollar, P., Girshick, R.: LVIS: a dataset for large vocabulary instance segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 5356\u20135364 (2019)","DOI":"10.1109\/CVPR.2019.00550"},{"key":"49_CR10","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 770\u2013778 (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"49_CR11","unstructured":"Karpathy, A.: A recipe for training neural networks (2019). http:\/\/karpathy.github.io\/2019\/04\/25\/recipe\/"},{"key":"49_CR12","unstructured":"Kingma, D.P., Ba, J.: Adam: a method for stochastic optimization. In: Bengio, Y., LeCun, Y. (eds.) 3rd International Conference on Learning Representations, ICLR 2015 (2015)"},{"key":"49_CR13","unstructured":"Maier-Hein, L., et al.: Surgical data science-from concepts to clinical translation. arXiv preprint arXiv:2011.02284 (2020)"},{"key":"49_CR14","doi-asserted-by":"crossref","unstructured":"Marcel, S., Rodriguez, Y.: Torchvision the machine-vision package of torch. In: Proceedings of the 18th ACM international conference on Multimedia, pp. 1485\u20131488 (2010)","DOI":"10.1145\/1873951.1874254"},{"key":"49_CR15","doi-asserted-by":"crossref","unstructured":"Mishra, P., Sarawadekar, K.: Polynomial learning rate policy with warm restart for deep neural network. In: TENCON 2019\u20132019 IEEE Region 10 Conference (TENCON), pp. 2087\u20132092. IEEE (2019)","DOI":"10.1109\/TENCON.2019.8929465"},{"issue":"1","key":"49_CR16","doi-asserted-by":"crossref","first-page":"1","DOI":"10.1038\/s41598-018-37186-2","volume":"9","author":"S Morita","year":"2019","unstructured":"Morita, S., Tabuchi, H., Masumoto, H., Yamauchi, T., Kamiura, N.: Real-time extraction of important surgical phases in cataract surgery videos. Sci. Rep. 9(1), 1\u20138 (2019)","journal-title":"Sci. Rep."},{"key":"49_CR17","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"139","DOI":"10.1007\/978-3-030-36711-4_13","volume-title":"Neural Information Processing","author":"Z-L Ni","year":"2019","unstructured":"Ni, Z.-L., et al.: RAUNet: residual attention U-Net for semantic segmentation of cataract surgical instruments. In: Gedeon, T., Wong, K.W., Lee, M. (eds.) ICONIP 2019. LNCS, vol. 11954, pp. 139\u2013149. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-36711-4_13"},{"issue":"3","key":"49_CR18","doi-asserted-by":"publisher","first-page":"632","DOI":"10.1016\/j.media.2010.10.001","volume":"16","author":"N Padoy","year":"2012","unstructured":"Padoy, N., Blum, T., Ahmadi, S.A., Feussner, H., Berger, M.O., Navab, N.: Statistical modeling and recognition of surgical workflow. Med. Image Anal. 16(3), 632\u2013641 (2012)","journal-title":"Med. Image Anal."},{"key":"49_CR19","doi-asserted-by":"crossref","unstructured":"Shrivastava, A., Gupta, A., Girshick, R.: Training region-based object detectors with online hard example mining. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR), June 2016","DOI":"10.1109\/CVPR.2016.89"},{"key":"49_CR20","doi-asserted-by":"crossref","unstructured":"Sun, K., Xiao, B., Liu, D., Wang, J.: Deep high-resolution representation learning for human pose estimation. In: CVPR (2019)","DOI":"10.1109\/CVPR.2019.00584"},{"issue":"14","key":"49_CR21","doi-asserted-by":"publisher","first-page":"5872","DOI":"10.1167\/iovs.16-19894","volume":"57","author":"W Wang","year":"2016","unstructured":"Wang, W., Yan, W., Fotis, K., Prasad, N.M., Lansingh, V.C., Taylor, H.R., Finger, R.P., Facciolo, D., He, M.: Cataract surgical rate and socioeconomics: a global study. Invest. Ophthalmol. Vis. Sci. 57(14), 5872\u20135881 (2016)","journal-title":"Invest. Ophthalmol. Vis. Sci."},{"key":"49_CR22","doi-asserted-by":"crossref","unstructured":"Xiao, T., Liu, Y., Zhou, B., Jiang, Y., Sun, J.: Unified perceptual parsing for scene understanding. In: Proceedings of the European Conference on Computer Vision (ECCV), pp. 418\u2013434 (2018)","DOI":"10.1007\/978-3-030-01228-1_26"},{"key":"49_CR23","doi-asserted-by":"crossref","unstructured":"Xie, S., Girshick, R., Doll\u00e1r, P., Tu, Z., He, K.: Aggregated residual transformations for deep neural networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 1492\u20131500 (2017)","DOI":"10.1109\/CVPR.2017.634"},{"issue":"4","key":"49_CR24","doi-asserted-by":"publisher","first-page":"e191860","DOI":"10.1001\/jamanetworkopen.2019.1860","volume":"2","author":"F Yu","year":"2019","unstructured":"Yu, F., et al.: Assessment of automated identification of phases in videos of cataract surgery using machine learning and deep learning techniques. JAMA Netw. Open 2(4), e191860\u2013e191860 (2019)","journal-title":"JAMA Netw. Open"},{"key":"49_CR25","unstructured":"Yuan, Y., Chen, X., Wang, J.: Object-contextual representations for semantic segmentation. arXiv preprint arXiv:1909.11065 (2019)"},{"key":"49_CR26","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"56","DOI":"10.1007\/978-3-030-32254-0_7","volume-title":"Medical Image Computing and Computer Assisted Intervention \u2013 MICCAI 2019","author":"D Zang","year":"2019","unstructured":"Zang, D., Bian, G.-B., Wang, Y., Li, Z.: An extremely fast and precise convolutional neural network for recognition and localization of cataract surgical tools. In: Shen, D., et al. (eds.) MICCAI 2019. LNCS, vol. 11768, pp. 56\u201364. Springer, Cham (2019). https:\/\/doi.org\/10.1007\/978-3-030-32254-0_7"},{"key":"49_CR27","doi-asserted-by":"crossref","unstructured":"Zhou, B., Zhao, H., Puig, X., Fidler, S., Barriuso, A., Torralba, A.: Scene parsing through ade20k dataset. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (2017)","DOI":"10.1109\/CVPR.2017.544"},{"key":"49_CR28","doi-asserted-by":"publisher","first-page":"302","DOI":"10.1007\/s11263-018-1140-0","volume":"127","author":"B Zhou","year":"2018","unstructured":"Zhou, B., et al.: Semantic understanding of scenes through the ade20k dataset. Int. J. Comput. Vis. 127, 302\u2013321 (2018)","journal-title":"Int. J. Comput. Vis."},{"key":"49_CR29","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"265","DOI":"10.1007\/978-3-030-00937-3_31","volume-title":"Medical Image Computing and Computer Assisted Intervention \u2013 MICCAI 2018","author":"O Zisimopoulos","year":"2018","unstructured":"Zisimopoulos, O., et al.: DeepPhase: surgical phase recognition in CATARACTS videos. In: Frangi, A.F., Schnabel, J.A., Davatzikos, C., Alberola-L\u00f3pez, C., Fichtinger, G. (eds.) MICCAI 2018. LNCS, vol. 11073, pp. 265\u2013272. Springer, Cham (2018). https:\/\/doi.org\/10.1007\/978-3-030-00937-3_31"}],"container-title":["Lecture Notes in Computer Science","Medical Image Computing and Computer Assisted Intervention \u2013 MICCAI 2021"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-030-87202-1_49","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,1,9]],"date-time":"2023-01-09T23:14:04Z","timestamp":1673306044000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-030-87202-1_49"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021]]},"ISBN":["9783030872014","9783030872021"],"references-count":29,"URL":"https:\/\/doi.org\/10.1007\/978-3-030-87202-1_49","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"value":"0302-9743","type":"print"},{"value":"1611-3349","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021]]},"assertion":[{"value":"21 September 2021","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"MICCAI","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Medical Image Computing and Computer-Assisted Intervention","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Strasbourg","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"France","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2021","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 September 2021","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"1 October 2021","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"miccai2021","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/miccai2021.org\/en\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Microsoft CMT","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1622","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"531","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"33% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"4","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"The conference was held virtually.","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}