{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,16]],"date-time":"2025-06-16T14:40:02Z","timestamp":1750084802155,"version":"3.41.0"},"publisher-location":"Cham","reference-count":42,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319541808"},{"type":"electronic","value":"9783319541815"}],"license":[{"start":{"date-parts":[[2017,1,1]],"date-time":"2017-01-01T00:00:00Z","timestamp":1483228800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017]]},"DOI":"10.1007\/978-3-319-54181-5_11","type":"book-chapter","created":{"date-parts":[[2017,3,9]],"date-time":"2017-03-09T15:27:37Z","timestamp":1489073257000},"page":"163-179","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":8,"title":["Semi-supervised Domain Adaptation for Weakly Labeled Semantic Video Object Segmentation"],"prefix":"10.1007","author":[{"given":"Huiling","family":"Wang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tapani","family":"Raiko","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Lasse","family":"Lensu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tinghuai","family":"Wang","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Juha","family":"Karhunen","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2017,3,10]]},"reference":[{"key":"11_CR1","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"282","DOI":"10.1007\/978-3-642-15555-0_21","volume-title":"Computer Vision \u2013 ECCV 2010","author":"T Brox","year":"2010","unstructured":"Brox, T., Malik, J.: Object segmentation by long term analysis of point trajectories. In: Daniilidis, K., Maragos, P., Paragios, N. (eds.) ECCV 2010. LNCS, vol. 6315, pp. 282\u2013295. Springer, Heidelberg (2010). doi:10.1007\/978-3-642-15555-0_21"},{"key":"11_CR2","doi-asserted-by":"crossref","unstructured":"Lee, Y.J., Kim, J., Grauman, K.: Key-segments for video object segmentation. In: ICCV, pp. 1995\u20132002 (2011)","DOI":"10.1109\/ICCV.2011.6126471"},{"key":"11_CR3","doi-asserted-by":"crossref","unstructured":"Zhang, D., Javed, O., Shah, M.: Video object segmentation through spatially accurate and temporally dense extraction of primary object regions. In: CVPR, pp. 628\u2013635 (2013)","DOI":"10.1109\/CVPR.2013.87"},{"key":"11_CR4","doi-asserted-by":"crossref","unstructured":"Papazoglou, A., Ferrari, V.: Fast object segmentation in unconstrained video. In: ICCV, pp. 1777\u20131784 (2013)","DOI":"10.1109\/ICCV.2013.223"},{"key":"11_CR5","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"553","DOI":"10.1007\/978-3-319-16817-3_36","volume-title":"Computer Vision \u2013 ACCV 2014","author":"T Wang","year":"2015","unstructured":"Wang, T., Wang, H.: Graph transduction learning of object proposals for video object segmentation. In: Cremers, D., Reid, I., Saito, H., Yang, M.-H. (eds.) ACCV 2014. LNCS, vol. 9006, pp. 553\u2013568. Springer, Heidelberg (2015). doi:10.1007\/978-3-319-16817-3_36"},{"key":"11_CR6","doi-asserted-by":"publisher","first-page":"159","DOI":"10.1016\/j.cviu.2015.11.006","volume":"143","author":"H Wang","year":"2016","unstructured":"Wang, H., Wang, T.: Primary object discovery and segmentation in videos via graph-based transductive inference. Comput. Vis. Image Underst. 143, 159\u2013172 (2016)","journal-title":"Comput. Vis. Image Underst."},{"key":"11_CR7","unstructured":"Krizhevsky, A., Sutskever, I., Hinton, G.E.: Imagenet classification with deep convolutional neural networks. In: NIPS, pp. 1106\u20131114 (2012)"},{"key":"11_CR8","unstructured":"Simonyan, K., Zisserman, A.: Very deep convolutional networks for large-scale image recognition, arXiv preprint (2014). arXiv:1409.1556"},{"key":"11_CR9","unstructured":"Rasmus, A., Valpola, H., Honkala, M., Berglund, M., Raiko, T.: Semi-supervised learning with ladder network. In: NIPS (2015)"},{"key":"11_CR10","doi-asserted-by":"crossref","unstructured":"Faktor, A., Irani, M.: Video segmentation by non-local consensus voting. In: BMVC, vol. 2, p. 6 (2014)","DOI":"10.5244\/C.28.21"},{"key":"11_CR11","volume-title":"Discovering primary objects in videos by saliency fusion and iterative appearance estimation","author":"J Yang","year":"2015","unstructured":"Yang, J., Zhao, G., Yuan, J., Shen, X., Lin, Z., Price, B., Brandt, J.: Discovering primary objects in videos by saliency fusion and iterative appearance estimation. IEEE Trans. Circuits Syst, Video Technol (2015)"},{"key":"11_CR12","doi-asserted-by":"crossref","unstructured":"Perazzi, F., Wang, O., Gross, M., Sorkine-Hornung, A.: Fully connected object proposals for video segmentation. In: ICCV, pp. 3227\u20133234 (2015)","DOI":"10.1109\/ICCV.2015.369"},{"key":"11_CR13","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"575","DOI":"10.1007\/978-3-642-15555-0_42","volume-title":"Computer Vision \u2013 ECCV 2010","author":"I Endres","year":"2010","unstructured":"Endres, I., Hoiem, D.: Category independent object proposals. In: Daniilidis, K., Maragos, P., Paragios, N. (eds.) ECCV 2010. LNCS, vol. 6315, pp. 575\u2013588. Springer, Heidelberg (2010). doi:10.1007\/978-3-642-15555-0_42"},{"key":"11_CR14","doi-asserted-by":"crossref","unstructured":"Manen, S., Guillaumin, M., Gool, L.J.V.: Prime object proposals with randomized prim\u2019s algorithm. In: ICCV, pp. 2536\u20132543 (2013)","DOI":"10.1109\/ICCV.2013.315"},{"key":"11_CR15","doi-asserted-by":"publisher","first-page":"574","DOI":"10.1145\/1015706.1015763","volume":"23","author":"J Wang","year":"2004","unstructured":"Wang, J., Xu, Y., Shum, H.Y., Cohen, M.F.: Video tooning. ACM Trans. Graph. 23, 574\u2013583 (2004)","journal-title":"ACM Trans. Graph."},{"key":"11_CR16","doi-asserted-by":"publisher","first-page":"540","DOI":"10.1109\/TVCG.2005.85","volume":"11","author":"JP Collomosse","year":"2005","unstructured":"Collomosse, J.P., Rowntree, D., Hall, P.M.: Stroke surfaces: temporally coherent artistic animations from video. IEEE Trans. Vis. Comput. Graph. 11, 540\u2013549 (2005)","journal-title":"IEEE Trans. Vis. Comput. Graph."},{"key":"11_CR17","doi-asserted-by":"publisher","first-page":"389","DOI":"10.1109\/TMM.2011.2177078","volume":"14","author":"T Wang","year":"2012","unstructured":"Wang, T., Collomosse, J.P.: Probabilistic motion diffusion of labeling priors for coherent video segmentation. IEEE Trans. Multimed. 14, 389\u2013400 (2012)","journal-title":"IEEE Trans. Multimed."},{"key":"11_CR18","doi-asserted-by":"publisher","first-page":"190","DOI":"10.1007\/s11263-011-0512-5","volume":"100","author":"D Tsai","year":"2012","unstructured":"Tsai, D., Flagg, M., Nakazawa, A., Rehg, J.M.: Motion coherent tracking using multi-label MRF optimization. Int. J. Comput. Vis. 100, 190\u2013202 (2012)","journal-title":"Int. J. Comput. Vis."},{"key":"11_CR19","doi-asserted-by":"crossref","unstructured":"Li, F., Kim, T., Humayun, A., Tsai, D., Rehg, J.M.: Video segmentation by tracking many figure-ground segments. In: ICCV, Australia, 1\u20138 December 2013, pp. 2192\u20132199 (2013)","DOI":"10.1109\/ICCV.2013.273"},{"key":"11_CR20","doi-asserted-by":"publisher","first-page":"14","DOI":"10.1016\/j.cviu.2013.10.013","volume":"120","author":"T Wang","year":"2014","unstructured":"Wang, T., Han, B., Collomosse, J.P.: Touchcut: fast image and video segmentation using single-touch interaction. Comput. Vis. Image Underst. 120, 14\u201330 (2014)","journal-title":"Comput. Vis. Image Underst."},{"key":"11_CR21","doi-asserted-by":"crossref","unstructured":"Grundmann, M., Kwatra, V., Han, M., Essa, I.A.: Efficient hierarchical graph-based video segmentation. In: CVPR, pp. 2141\u20132148 (2010)","DOI":"10.1109\/CVPR.2010.5539893"},{"key":"11_CR22","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"626","DOI":"10.1007\/978-3-642-33783-3_45","volume-title":"Computer Vision \u2013 ECCV 2012","author":"C Xu","year":"2012","unstructured":"Xu, C., Xiong, C., Corso, J.J.: Streaming hierarchical video segmentation. In: Fitzgibbon, A., Lazebnik, S., Perona, P., Sato, Y., Schmid, C. (eds.) ECCV 2012. LNCS, vol. 7577, pp. 626\u2013639. Springer, Heidelberg (2012). doi:10.1007\/978-3-642-33783-3_45"},{"key":"11_CR23","doi-asserted-by":"crossref","unstructured":"Wang, C., de La Gorce, M., Paragios, N.: Segmentation, ordering and multi-object tracking using graphical models. In: ICCV, pp. 747\u2013754 (2009)","DOI":"10.1109\/ICCV.2009.5459247"},{"key":"11_CR24","doi-asserted-by":"crossref","unstructured":"Sundberg, P., Brox, T., Maire, M., Arbelaez, P., Malik, J.: Occlusion boundary detection and figure\/ground assignment from optical flow. In: CVPR, pp. 2233\u20132240 (2011)","DOI":"10.1109\/CVPR.2011.5995364"},{"key":"11_CR25","doi-asserted-by":"crossref","unstructured":"Giordano, D., Murabito, F., Palazzo, S., Spampinato, C.: Superpixel-based video object segmentation using perceptual organization and location prior. In: CVPR, pp. 4814\u20134822 (2015)","DOI":"10.1109\/CVPR.2015.7299114"},{"key":"11_CR26","doi-asserted-by":"crossref","unstructured":"Taylor, B., Karasev, V., Soatto, S.: Causal video object segmentation from persistence of occlusions. In: CVPR, pp. 4268\u20134276 (2015)","DOI":"10.1109\/CVPR.2015.7299055"},{"key":"11_CR27","doi-asserted-by":"crossref","unstructured":"Wang, W., Shen, J., Porikli, F.: Saliency-aware geodesic video object segmentation. In: CVPR, pp. 3395\u20133402 (2015)","DOI":"10.1109\/CVPR.2015.7298961"},{"key":"11_CR28","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"198","DOI":"10.1007\/978-3-642-33863-2_20","volume-title":"Computer Vision \u2013 ECCV 2012. Workshops and Demonstrations","author":"G Hartmann","year":"2012","unstructured":"Hartmann, G., Grundmann, M., Hoffman, J., Tsai, D., Kwatra, V., Madani, O., Vijayanarasimhan, S., Essa, I., Rehg, J., Sukthankar, R.: Weakly supervised learning of object segmentations from web-scale video. In: Fusiello, A., Murino, V., Cucchiara, R. (eds.) ECCV 2012. LNCS, vol. 7583, pp. 198\u2013208. Springer, Heidelberg (2012). doi:10.1007\/978-3-642-33863-2_20"},{"key":"11_CR29","doi-asserted-by":"crossref","unstructured":"Tang, K.D., Sukthankar, R., Yagnik, J., Li, F.: Discriminative segment annotation in weakly labeled video. In: CVPR, pp. 2483\u20132490 (2013)","DOI":"10.1109\/CVPR.2013.321"},{"key":"11_CR30","doi-asserted-by":"crossref","unstructured":"Liu, X., Tao, D., Song, M., Ruan, Y., Chen, C., Bu, J.: Weakly supervised multiclass video segmentation. In: CVPR, pp. 57\u201364 (2014)","DOI":"10.1109\/CVPR.2014.15"},{"key":"11_CR31","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Chen, X., Li, J., Wang, C., Xia, C.: Semantic object segmentation via detection in weakly labeled video. In: CVPR, pp. 3641\u20133649 (2015)","DOI":"10.1109\/CVPR.2015.7298987"},{"key":"11_CR32","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Rich feature hierarchies for accurate object detection and semantic segmentation. In: CVPR, pp. 580\u2013587 (2014)","DOI":"10.1109\/CVPR.2014.81"},{"key":"11_CR33","unstructured":"Zhou, D., Bousquet, O., Lal, T.N., Weston, J., Sch, B.: Learning with local and global consistency. In: NIPS, pp. 321\u2013328 (2004)"},{"key":"11_CR34","doi-asserted-by":"publisher","first-page":"309","DOI":"10.1145\/1015706.1015720","volume":"23","author":"C Rother","year":"2004","unstructured":"Rother, C., Kolmogorov, V., Blake, A.: \u201cGrabCut\u201d: interactive foreground extraction using iterated graph cuts. ACM Trans. Graph. 23, 309\u2013314 (2004)","journal-title":"ACM Trans. Graph."},{"key":"11_CR35","doi-asserted-by":"publisher","first-page":"1222","DOI":"10.1109\/34.969114","volume":"23","author":"Y Boykov","year":"2001","unstructured":"Boykov, Y., Veksler, O., Zabih, R.: Fast approximate energy minimization via graph cuts. IEEE Trans. Pattern Anal. Mach. Intell. 23, 1222\u20131239 (2001)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"11_CR36","doi-asserted-by":"crossref","unstructured":"Jia, Y., Shelhamer, E., Donahue, J., Karayev, S., Long, J., Girshick, R., Guadarrama, S., Darrell, T.: Caffe: convolutional architecture for fast feature embedding. In: Proceedings of the ACM International Conference on Multimedia, pp. 675\u2013678. ACM (2014)","DOI":"10.1145\/2647868.2654889"},{"key":"11_CR37","doi-asserted-by":"crossref","unstructured":"Arbelaez, P., Maire, M., Fowlkes, C.C., Malik, J.: From contours to regions: an empirical evaluation. In: CVPR, pp. 2294\u20132301 (2009)","DOI":"10.1109\/CVPRW.2009.5206707"},{"key":"11_CR38","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"25","DOI":"10.1007\/978-3-540-24673-2_3","volume-title":"Computer Vision - ECCV 2004","author":"T Brox","year":"2004","unstructured":"Brox, T., Bruhn, A., Papenberg, N., Weickert, J.: High accuracy optical flow estimation based on a theory for warping. In: Pajdla, T., Matas, J. (eds.) ECCV 2004. LNCS, vol. 3024, pp. 25\u201336. Springer, Heidelberg (2004). doi:10.1007\/978-3-540-24673-2_3"},{"key":"11_CR39","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"282","DOI":"10.1007\/978-3-642-15555-0_21","volume-title":"Computer Vision \u2013 ECCV 2010","author":"T Brox","year":"2010","unstructured":"Brox, T., Malik, J.: Object segmentation by long term analysis of point trajectories. In: Daniilidis, K., Maragos, P., Paragios, N. (eds.) ECCV 2010. LNCS, vol. 6315, pp. 282\u2013295. Springer, Heidelberg (2010). doi:10.1007\/978-3-642-15555-0_21"},{"key":"11_CR40","doi-asserted-by":"crossref","unstructured":"Prest, A., Leistner, C., Civera, J., Schmid, C., Ferrari, V.: Learning object class detectors from weakly annotated video. In: CVPR, pp. 3282\u20133289 (2012)","DOI":"10.1109\/CVPR.2012.6248065"},{"key":"11_CR41","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"656","DOI":"10.1007\/978-3-319-10593-2_43","volume-title":"Computer Vision \u2013 ECCV 2014","author":"SD Jain","year":"2014","unstructured":"Jain, S.D., Grauman, K.: Supervoxel-consistent foreground propagation in video. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8692, pp. 656\u2013671. Springer, Heidelberg (2014). doi:10.1007\/978-3-319-10593-2_43"},{"key":"11_CR42","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"640","DOI":"10.1007\/978-3-319-10593-2_42","volume-title":"Computer Vision \u2013 ECCV 2014","author":"L Wang","year":"2014","unstructured":"Wang, L., Hua, G., Sukthankar, R., Xue, J., Zheng, N.: Video object discovery and co-segmentation with extremely weak supervision. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8692, pp. 640\u2013655. Springer, Heidelberg (2014). doi:10.1007\/978-3-319-10593-2_42"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ACCV 2016"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-54181-5_11","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,16]],"date-time":"2025-06-16T14:22:14Z","timestamp":1750083734000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-54181-5_11"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017]]},"ISBN":["9783319541808","9783319541815"],"references-count":42,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-54181-5_11","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2017]]},"assertion":[{"value":"10 March 2017","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ACCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Asian Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Taipei","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Taiwan","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2016","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20 November 2016","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24 November 2016","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"13","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"accv2016","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.accv2016.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}