{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,26]],"date-time":"2025-03-26T20:57:25Z","timestamp":1743022645953,"version":"3.40.3"},"publisher-location":"Cham","reference-count":34,"publisher":"Springer International Publishing","isbn-type":[{"type":"print","value":"9783319541808"},{"type":"electronic","value":"9783319541815"}],"license":[{"start":{"date-parts":[[2017,1,1]],"date-time":"2017-01-01T00:00:00Z","timestamp":1483228800000},"content-version":"unspecified","delay-in-days":0,"URL":"http:\/\/www.springer.com\/tdm"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2017]]},"DOI":"10.1007\/978-3-319-54181-5_8","type":"book-chapter","created":{"date-parts":[[2017,3,9]],"date-time":"2017-03-09T15:27:37Z","timestamp":1489073257000},"page":"121-136","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Learning to Generate Object Segment Proposals with Multi-modal Cues"],"prefix":"10.1007","author":[{"given":"Haoyang","family":"Zhang","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xuming","family":"He","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Fatih","family":"Porikli","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2017,3,10]]},"reference":[{"key":"8_CR1","doi-asserted-by":"crossref","unstructured":"Girshick, R., Donahue, J., Darrell, T., Malik, J.: Region-based convolutional networks for accurate object detection and segmentation. IEEE Trans. Pattern Anal. Mach. Intell. 38(1), 142\u2013158 (2015)","DOI":"10.1109\/TPAMI.2015.2437384"},{"key":"8_CR2","doi-asserted-by":"crossref","unstructured":"Girshick, R.B.: Fast R-CNN. CoRR abs\/1504.08083 (2015)","DOI":"10.1109\/ICCV.2015.169"},{"key":"8_CR3","unstructured":"Ren, S., He, K., Girshick, R., Sun, J.: Faster R-CNN: Towards real-time object detection with region proposal networks. In: Advances in Neural Information Processing Systems, pp. 91\u201399 (2015)"},{"key":"8_CR4","doi-asserted-by":"crossref","unstructured":"Alexe, B., Deselaers, T., Ferrari, V.: What is an object? In: 2010 IEEE Conference on Computer Vision and Pattern Recognition (CVPR), pp. 73\u201380. IEEE (2010)","DOI":"10.1109\/CVPR.2010.5540226"},{"key":"8_CR5","doi-asserted-by":"publisher","first-page":"154","DOI":"10.1007\/s11263-013-0620-5","volume":"104","author":"JR Uijlings","year":"2013","unstructured":"Uijlings, J.R., van de Sande, K.E., Gevers, T., Smeulders, A.W.: Selective search for object recognition. Intl. J. Comput. Vis. 104, 154\u2013171 (2013)","journal-title":"Intl. J. Comput. Vis."},{"key":"8_CR6","doi-asserted-by":"crossref","unstructured":"Cheng, M.M., Zhang, Z., Lin, W.Y., Torr, P.: Bing: Binarized normed gradients for objectness estimation at 300fps. In: IEEE CVPR (2014)","DOI":"10.1109\/CVPR.2014.414"},{"key":"8_CR7","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"391","DOI":"10.1007\/978-3-319-10602-1_26","volume-title":"Computer Vision \u2013 ECCV 2014","author":"CL Zitnick","year":"2014","unstructured":"Zitnick, C.L., Doll\u00e1r, P.: Edge boxes: locating object proposals from edges. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8693, pp. 391\u2013405. Springer, Heidelberg (2014). doi:10.1007\/978-3-319-10602-1_26"},{"key":"8_CR8","doi-asserted-by":"publisher","first-page":"1312","DOI":"10.1109\/TPAMI.2011.231","volume":"34","author":"J Carreira","year":"2012","unstructured":"Carreira, J., Sminchisescu, C.: CPMC: automatic object segmentation using constrained parametric min-cuts. IEEE Trans. Pattern Anal. Mach. Intell. 34, 1312\u20131328 (2012)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"8_CR9","doi-asserted-by":"crossref","unstructured":"Pont-Tuset, J., Arbel\u00e1ez, P., Barron, J., Marques, F., Malik, J.: Multiscale combinatorial grouping for image segmentation and object proposal generation (2015). arXiv:1503.00848","DOI":"10.1109\/CVPR.2014.49"},{"key":"8_CR10","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"575","DOI":"10.1007\/978-3-642-15555-0_42","volume-title":"Computer Vision \u2013 ECCV 2010","author":"I Endres","year":"2010","unstructured":"Endres, I., Hoiem, D.: Category independent object proposals. In: Daniilidis, K., Maragos, P., Paragios, N. (eds.) ECCV 2010. LNCS, vol. 6315, pp. 575\u2013588. Springer, Heidelberg (2010). doi:10.1007\/978-3-642-15555-0_42"},{"key":"8_CR11","doi-asserted-by":"crossref","unstructured":"Kr\u00e4henb\u00fchl, P., Koltun, V.: Learning to propose objects. In: CVPR (2015)","DOI":"10.1109\/CVPR.2015.7298765"},{"key":"8_CR12","unstructured":"Pinheiro, P.O., Collobert, R., Dollar, P.: Learning to segment object candidates. In: Advances in Neural Information Processing Systems, pp. 1981\u20131989 (2015)"},{"key":"8_CR13","doi-asserted-by":"crossref","unstructured":"Dai, J., He, K., Sun, J.: Instance-aware semantic segmentation via multi-task network cascades, arXiv preprint (2015). arXiv:1512.04412","DOI":"10.1109\/CVPR.2016.343"},{"key":"8_CR14","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"467","DOI":"10.1007\/978-3-642-33715-4_34","volume-title":"Computer Vision \u2013 ECCV 2012","author":"M Bleyer","year":"2012","unstructured":"Bleyer, M., Rhemann, C., Rother, C.: Extracting 3D scene-consistent object proposals and depth from stereo images. In: Fitzgibbon, A., Lazebnik, S., Perona, P., Sato, Y., Schmid, C. (eds.) ECCV 2012. LNCS, vol. 7576, pp. 467\u2013481. Springer, Heidelberg (2012). doi:10.1007\/978-3-642-33715-4_34"},{"key":"8_CR15","unstructured":"Chen, X., Kundu, K., Zhu, Y., Berneshawi, A., Ma, H., Fidler, S., Urtasun, R.: 3d object proposals for accurate object class detection. In: NIPS (2015)"},{"key":"8_CR16","doi-asserted-by":"crossref","unstructured":"Cordts, M., Omran, M., Ramos, S., Rehfeld, T., Enzweiler, M., Benenson, R., Franke, U., Roth, S., Schiele, B.: The cityscapes dataset for semantic urban scene understanding, arXiv preprint (2016). arXiv:1604.01685","DOI":"10.1109\/CVPR.2016.350"},{"key":"8_CR17","unstructured":"Hosang, J., Benenson, R., Doll\u00e1r, P., Schiele, B.: What makes for effective detection proposals? arXiv preprint (2015). arXiv:1502.05082"},{"key":"8_CR18","doi-asserted-by":"crossref","unstructured":"Humayun, A., Li, F., Rehg, J.M.: The middle child problem: revisiting parametric min-cut and seeds for object proposals. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1600\u20131608 (2015)","DOI":"10.1109\/ICCV.2015.187"},{"key":"8_CR19","doi-asserted-by":"crossref","unstructured":"Lee, T., Fidler, S., Dickinson, S.: Learning to combine mid-level cues for object proposal generation. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 1680\u20131688 (2015)","DOI":"10.1109\/ICCV.2015.196"},{"key":"8_CR20","doi-asserted-by":"crossref","unstructured":"Wang, C., Zhao, L., Liang, S., Zhang, L., Jia, J., Wei, Y.: Object proposal by multi-branch hierarchical segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3873\u20133881 (2015)","DOI":"10.1109\/CVPR.2015.7299012"},{"key":"8_CR21","doi-asserted-by":"crossref","unstructured":"Rantalankila, P., Kannala, J., Rahtu, E.: Generating object segmentation proposals using global and local search. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 2417\u20132424 (2014)","DOI":"10.1109\/CVPR.2014.310"},{"key":"8_CR22","doi-asserted-by":"crossref","unstructured":"Yanulevskaya, V., Uijlings, J., Sebe, N.: Learning to group objects. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3134\u20133141 (2014)","DOI":"10.1109\/CVPR.2014.401"},{"key":"8_CR23","doi-asserted-by":"crossref","unstructured":"Kuo, W., Hariharan, B., Malik, J.: Deepbox: Learning objectness with convolutional networks, arXiv preprint (2015). arXiv:1505.02146","DOI":"10.1109\/ICCV.2015.285"},{"key":"8_CR24","doi-asserted-by":"crossref","unstructured":"Ghodrati, A., Diba, A., Pedersoli, M., Tuytelaars, T., Van Gool, L.: Deepproposal: hunting objects by cascading deep convolutional layers. In: Proceedings of the IEEE International Conference on Computer Vision, pp. 2578\u20132586 (2015)","DOI":"10.1109\/ICCV.2015.296"},{"key":"8_CR25","unstructured":"Sharma, A., Tuzel, O., Liu, M.Y.: Recursive context propagation network for semantic scene labeling. In: Advances in Neural Information Processing Systems, pp. 2447\u20132455 (2014)"},{"key":"8_CR26","doi-asserted-by":"crossref","unstructured":"Zagoruyko, S., Komodakis, N.: Learning to compare image patches via convolutional neural networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4353\u20134361 (2015)","DOI":"10.1109\/CVPR.2015.7299064"},{"key":"8_CR27","doi-asserted-by":"crossref","unstructured":"Long, J., Shelhamer, E., Darrell, T.: Fully convolutional networks for semantic segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3431\u20133440 (2015)","DOI":"10.1109\/CVPR.2015.7298965"},{"key":"8_CR28","doi-asserted-by":"crossref","unstructured":"Hariharan, B., Arbel\u00e1ez, P., Girshick, R., Malik, J.: Hypercolumns for object segmentation and fine-grained localization. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 447\u2013456 (2015)","DOI":"10.1109\/CVPR.2015.7298642"},{"key":"8_CR29","doi-asserted-by":"crossref","unstructured":"Mottaghi, R., Chen, X., Liu, X., Cho, N.G., Lee, S.W., Fidler, S., Urtasun, R., Yuille, A.: The role of context for object detection and semantic segmentation in the wild. In: IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2014)","DOI":"10.1109\/CVPR.2014.119"},{"key":"8_CR30","doi-asserted-by":"crossref","unstructured":"Dai, J., He, K., Sun, J.: Convolutional feature masking for joint object and stuff segmentation. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 3992\u20134000 (2015)","DOI":"10.1109\/CVPR.2015.7299025"},{"key":"8_CR31","doi-asserted-by":"publisher","first-page":"1558","DOI":"10.1109\/TPAMI.2014.2377715","volume":"37","author":"P Doll\u00e1r","year":"2015","unstructured":"Doll\u00e1r, P., Zitnick, C.L.: Fast edge detection using structured forests. IEEE Trans. Pattern Anal. Mach. Intell. 37, 1558\u20131570 (2015)","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"8_CR32","doi-asserted-by":"crossref","unstructured":"Vedaldi, A., Lenc, K.: Matconvnet: convolutional neural networks for matlab. In: Proceedings of the 23rd Annual ACM Conference on Multimedia Conference, pp. 689\u2013692. ACM (2015)","DOI":"10.1145\/2733373.2807412"},{"key":"8_CR33","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"756","DOI":"10.1007\/978-3-319-10602-1_49","volume-title":"Computer Vision \u2013 ECCV 2014","author":"K Yamaguchi","year":"2014","unstructured":"Yamaguchi, K., McAllester, D., Urtasun, R.: Efficient joint segmentation, occlusion labeling, stereo and flow estimation. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8693, pp. 756\u2013771. Springer, Heidelberg (2014). doi:10.1007\/978-3-319-10602-1_49"},{"key":"8_CR34","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"725","DOI":"10.1007\/978-3-319-10602-1_47","volume-title":"Computer Vision \u2013 ECCV 2014","author":"P Kr\u00e4henb\u00fchl","year":"2014","unstructured":"Kr\u00e4henb\u00fchl, P., Koltun, V.: Geodesic object proposals. In: Fleet, D., Pajdla, T., Schiele, B., Tuytelaars, T. (eds.) ECCV 2014. LNCS, vol. 8693, pp. 725\u2013739. Springer, Heidelberg (2014). doi:10.1007\/978-3-319-10602-1_47"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ACCV 2016"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-319-54181-5_8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,11]],"date-time":"2024-03-11T15:26:27Z","timestamp":1710170787000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-319-54181-5_8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2017]]},"ISBN":["9783319541808","9783319541815"],"references-count":34,"URL":"https:\/\/doi.org\/10.1007\/978-3-319-54181-5_8","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2017]]},"assertion":[{"value":"10 March 2017","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ACCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Asian Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Taipei","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Taiwan","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2016","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"20 November 2016","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"24 November 2016","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"13","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"accv2016","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"http:\/\/www.accv2016.org\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}