{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T21:55:50Z","timestamp":1775253350541,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":46,"publisher":"ACM","license":[{"start":{"date-parts":[[2018,10,15]],"date-time":"2018-10-15T00:00:00Z","timestamp":1539561600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2018,10,15]]},"DOI":"10.1145\/3240508.3240652","type":"proceedings-article","created":{"date-parts":[[2018,10,18]],"date-time":"2018-10-18T13:52:08Z","timestamp":1539870728000},"page":"1670-1678","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":90,"title":["ModaNet"],"prefix":"10.1145","author":[{"given":"Shuai","family":"Zheng","sequence":"first","affiliation":[{"name":"eBay Inc., San Jose, CA, USA"}]},{"given":"Fan","family":"Yang","sequence":"additional","affiliation":[{"name":"eBay Inc., San Jose, CA, USA"}]},{"given":"M. Hadi","family":"Kiapour","sequence":"additional","affiliation":[{"name":"eBay Inc., San Francisco, CA, USA"}]},{"given":"Robinson","family":"Piramuthu","sequence":"additional","affiliation":[{"name":"eBay Inc., San Francisco, CA, USA"}]}],"member":"320","published-online":{"date-parts":[[2018,10,15]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"crossref","unstructured":"David Acuna Huan Ling Amlan Kar and Sanja Fidler. 2018. Efficient Interactive Annotation of Segmentation Datasets with Polygon-RNN++. In CVPR. David Acuna Huan Ling Amlan Kar and Sanja Fidler. 2018. Efficient Interactive Annotation of Segmentation Datasets with Polygon-RNN++. In CVPR.","DOI":"10.1109\/CVPR.2018.00096"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"crossref","unstructured":"Navaneeth Bodla Bharat Singh Rama Chellappa and Larry S. Davis. 2017. Soft- NMS - Improving Object Detection with One Line of Code. In ICCV. 5562--5570. Navaneeth Bodla Bharat Singh Rama Chellappa and Larry S. Davis. 2017. Soft- NMS - Improving Object Detection with One Line of Code. In ICCV. 5562--5570.","DOI":"10.1109\/ICCV.2017.593"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"crossref","unstructured":"Lluis Castrejon Kaustav Kundu Raquel Urtasun and Sanja Fidler. 2017. Annotating Object Instances with a Polygon-RNN. In CVPR. Lluis Castrejon Kaustav Kundu Raquel Urtasun and Sanja Fidler. 2017. Annotating Object Instances with a Polygon-RNN. In CVPR.","DOI":"10.1109\/CVPR.2017.477"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2699184"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"Liang-Chieh Chen Yukun Zhu George Papandreou Florian Schroff and Hartwig Adam. 2018. Encoder-Decoder with Atrous Separable Convolution for Semantic Image Segmentation. In CVPR. Liang-Chieh Chen Yukun Zhu George Papandreou Florian Schroff and Hartwig Adam. 2018. Encoder-Decoder with Atrous Separable Convolution for Semantic Image Segmentation. In CVPR.","DOI":"10.1007\/978-3-030-01234-2_49"},{"key":"e_1_3_2_1_6_1","volume-title":"Xception: Deep Learning with Depthwise Separable Convolutions. In CVPR.","author":"Chollet Francois","year":"2017"},{"key":"e_1_3_2_1_7_1","unstructured":"Jifeng Dai Yi Li Kaiming He and Jian Sun. 2016. R-FCN: Object Detection via Region-based Fully Convolutional Networks. In NIPS. Jifeng Dai Yi Li Kaiming He and Jian Sun. 2016. R-FCN: Object Detection via Region-based Fully Convolutional Networks. In NIPS."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"crossref","unstructured":"Jifeng Dai Haozhi Qi Yuwen Xiong Yi Li Guodong Zhang Han Hu and Yichen Wei. 2017. Deformable Convolutional Networks. In ICCV. 764--773. Jifeng Dai Haozhi Qi Yuwen Xiong Yi Li Guodong Zhang Han Hu and Yichen Wei. 2017. Deformable Convolutional Networks. In ICCV. 764--773.","DOI":"10.1109\/ICCV.2017.89"},{"key":"e_1_3_2_1_9_1","volume-title":"Imagenet: A large-scale hierarchical image database. In CVPR.","author":"Deng Jia","year":"2009"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.423"},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.169"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"crossref","unstructured":"Kota Hara Vignesh Jagadeesh and Robinson Piramuthu. 2016. Fashion apparel detection: The role of deep convolutional neural network and pose-dependent priors. In WACV. 1--9. Kota Hara Vignesh Jagadeesh and Robinson Piramuthu. 2016. Fashion apparel detection: The role of deep convolutional neural network and pose-dependent priors. In WACV. 1--9.","DOI":"10.1109\/WACV.2016.7477611"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"crossref","unstructured":"Bharath Hariharan Pablo Arbelaez Ross Girshick and Jitendra Malik. 2014. Simultaneous Detection and Segmentation. In ECCV. Bharath Hariharan Pablo Arbelaez Ross Girshick and Jitendra Malik. 2014. Simultaneous Detection and Segmentation. In ECCV.","DOI":"10.1007\/978-3-319-10584-0_20"},{"key":"e_1_3_2_1_15_1","unstructured":"Kaiming He Xiangyu Zhang Shaoqing Ren and Jian Sun. 2016. Deep Residual Learning for Image Recognition. Kaiming He Xiangyu Zhang Shaoqing Ren and Jian Sun. 2016. Deep Residual Learning for Image Recognition."},{"key":"e_1_3_2_1_16_1","unstructured":"Xuming He Richard S Zemel and Miguel A Carreira-Perpinan. 2014. Multiscale Conditional Random Fields for Image Labeling. In CVPR. Xuming He Richard S Zemel and Miguel A Carreira-Perpinan. 2014. Multiscale Conditional Random Fields for Image Labeling. In CVPR."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.127"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.382"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"crossref","unstructured":"Lubor Ladicky Chris Russell Pushmeet Kohli and Philip HS Torr. 2009. Associative hierarchical crfs for object class image segmentation. In ICCV. Lubor Ladicky Chris Russell Pushmeet Kohli and Philip HS Torr. 2009. Associative hierarchical crfs for object class image segmentation. In ICCV.","DOI":"10.1109\/ICCV.2009.5459248"},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2015.2408360"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.163"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"crossref","unstructured":"G. Lin C. Shen A. van den Hengel and I. D. Reid. 2017. Exploring context with deep structured models for semantic segmentation. In CVPR. G. Lin C. Shen A. van den Hengel and I. D. Reid. 2017. Exploring context with deep structured models for semantic segmentation. In CVPR.","DOI":"10.1109\/CVPR.2016.348"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"crossref","unstructured":"Tsung-Yi Lin Piotr Doll\u00e1r Ross B. Girshick Kaiming He Bharath Hariharan and Serge J. Belongie. 2017. Feature Pyramid Networks for Object Detection. In CVPR. 936--944. Tsung-Yi Lin Piotr Doll\u00e1r Ross B. Girshick Kaiming He Bharath Hariharan and Serge J. Belongie. 2017. Feature Pyramid Networks for Object Detection. In CVPR. 936--944.","DOI":"10.1109\/CVPR.2017.106"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"crossref","unstructured":"Tsung-Yi Lin Priya Goyal Ross B. Girshick Kaiming He and Piotr Doll\u00e1r. 2017. Focal Loss for Dense Object Detection. In ICCV. 2999--3007. Tsung-Yi Lin Priya Goyal Ross B. Girshick Kaiming He and Piotr Doll\u00e1r. 2017. Focal Loss for Dense Object Detection. In ICCV. 2999--3007.","DOI":"10.1109\/ICCV.2017.324"},{"key":"e_1_3_2_1_25_1","unstructured":"Tsung-Yi Lin Michael Maire Serge Belongie James Hays Pietro Perona Deva Ramanan Piotr Dollar and C Lawrence Zitnick. 2014. Microsoft coco: Common objects in context. In ECCV. Tsung-Yi Lin Michael Maire Serge Belongie James Hays Pietro Perona Deva Ramanan Piotr Dollar and C Lawrence Zitnick. 2014. Microsoft coco: Common objects in context. In ECCV."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2013.2285526"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/2647868.2654932"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"crossref","unstructured":"Wei Liu Dragomir Anguelov Dumitru Erhan Christian Szegedy Scott Reed Cheng-Yang Fu and Alexander C. Berg. 2016. SSD: Single Shot MultiBox Detector. In ECCV. Wei Liu Dragomir Anguelov Dumitru Erhan Christian Szegedy Scott Reed Cheng-Yang Fu and Alexander C. Berg. 2016. SSD: Single Shot MultiBox Detector. In ECCV.","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"e_1_3_2_1_29_1","first-page":"37","article-title":"Deep learning markov random field for semantic segmentation","volume":"35","author":"Liu Ziwei","year":"2017","journal-title":"IEEE Trans. Pattern Anal. Mach. Intell."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"crossref","unstructured":"Ziwei Liu Ping Luo Shi Qiu XiaogangWang and Xiaoou Tang. 2016. DeepFashion: Powering Robust Clothes Recognition and Retrieval with Rich Annotations. In CVPR. 1096--1104. Ziwei Liu Ping Luo Shi Qiu XiaogangWang and Xiaoou Tang. 2016. DeepFashion: Powering Robust Clothes Recognition and Retrieval with Rich Annotations. In CVPR. 1096--1104.","DOI":"10.1109\/CVPR.2016.124"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"crossref","unstructured":"Joseph Redmon Santosh Divvala Ross Girshick and Ali Farhadi. 2016. You only look once: Unified real-time object detection. In CVPR. Joseph Redmon Santosh Divvala Ross Girshick and Ali Farhadi. 2016. You only look once: Unified real-time object detection. In CVPR.","DOI":"10.1109\/CVPR.2016.91"},{"key":"e_1_3_2_1_32_1","unstructured":"Shaoqing Ren Kaiming He Ross Girshick and Jian Sun. 2015. Faster R-CNN: Towards Real-Time Object Detection with Region Proposal Networks. In NIPS. Shaoqing Ren Kaiming He Ross Girshick and Jian Sun. 2015. Faster R-CNN: Towards Real-Time Object Detection with Region Proposal Networks. In NIPS."},{"key":"e_1_3_2_1_33_1","unstructured":"A. G. Schwing and R. Urtasun. 2015. Fully connected deep structured networks. In arXiv:1503.02351. A. G. Schwing and R. Urtasun. 2015. Fully connected deep structured networks. In arXiv:1503.02351."},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2572683"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1007\/11744023_1"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"crossref","unstructured":"Abhinav Shrivastava Abhinav Gupta and Ross B. Girshick. 2016. Training Region-Based Object Detectors with Online Hard Example Mining. In CVPR. 761--769. Abhinav Shrivastava Abhinav Gupta and Ross B. Girshick. 2016. Training Region-Based Object Detectors with Online Hard Example Mining. In CVPR. 761--769.","DOI":"10.1109\/CVPR.2016.89"},{"key":"e_1_3_2_1_37_1","unstructured":"Marcel Simon Erik Rodner and Joachim Denzler. 2016. ImageNet pre-trained models with batch normalization. arXiv preprint arXiv:1612.01452 (2016). Marcel Simon Erik Rodner and Joachim Denzler. 2016. ImageNet pre-trained models with batch normalization. arXiv preprint arXiv:1612.01452 (2016)."},{"key":"e_1_3_2_1_38_1","unstructured":"K. Simonyan and A. Zisserman. 2015. Very Deep Convolutional Networks for Large-Scale Image Recognition. In ICLR. K. Simonyan and A. Zisserman. 2015. Very Deep Convolutional Networks for Large-Scale Image Recognition. In ICLR."},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"crossref","unstructured":"Christian Szegedy Sergey Ioffe Vincent Vanhoucke and Alexander A Alemi. 2017. Inception-v4 inception-resnet and the impact of residual connections on learning. In AAAI. Christian Szegedy Sergey Ioffe Vincent Vanhoucke and Alexander A Alemi. 2017. Inception-v4 inception-resnet and the impact of residual connections on learning. In AAAI.","DOI":"10.1609\/aaai.v31i1.11231"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.437"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"crossref","unstructured":"Kota Yamaguchi M. Hadi Kiapour Luis E. Ortiz and Tamara L. Berg. 2012. Parsing clothing in fashion photographs. In CVPR. 3570--3577. Kota Yamaguchi M. Hadi Kiapour Luis E. Ortiz and Tamara L. Berg. 2012. Parsing clothing in fashion photographs. In CVPR. 3570--3577.","DOI":"10.1109\/CVPR.2012.6248101"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.407"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.32"},{"key":"e_1_3_2_1_44_1","unstructured":"Fisher Yu and Vladlen Koltun. 2016. Multi-Scale Context Aggregation by Dilated Convolutions. In ICLR. Fisher Yu and Vladlen Koltun. 2016. Multi-Scale Context Aggregation by Dilated Convolutions. In ICLR."},{"key":"e_1_3_2_1_45_1","unstructured":"HengShuang Zhao Jianping Shi Xiaojuan Qi Xiaogang Wang and Jiaya Jia. 2017. Pyramid Scene Parsing Network. In CVPR. 1063--6919. HengShuang Zhao Jianping Shi Xiaojuan Qi Xiaogang Wang and Jiaya Jia. 2017. Pyramid Scene Parsing Network. In CVPR. 1063--6919."},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.179"}],"event":{"name":"MM '18: ACM Multimedia Conference","location":"Seoul Republic of Korea","acronym":"MM '18","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 26th ACM international conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3240508.3240652","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3240508.3240652","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,3]],"date-time":"2026-04-03T20:40:57Z","timestamp":1775248857000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3240508.3240652"}},"subtitle":["A Large-scale Street Fashion Dataset with Polygon Annotations"],"short-title":[],"issued":{"date-parts":[[2018,10,15]]},"references-count":46,"alternative-id":["10.1145\/3240508.3240652","10.1145\/3240508"],"URL":"https:\/\/doi.org\/10.1145\/3240508.3240652","relation":{},"subject":[],"published":{"date-parts":[[2018,10,15]]},"assertion":[{"value":"2018-10-15","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}