{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,18]],"date-time":"2025-06-18T04:21:27Z","timestamp":1750220487161,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":46,"publisher":"ACM","license":[{"start":{"date-parts":[[2021,10,17]],"date-time":"2021-10-17T00:00:00Z","timestamp":1634428800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2021,10,17]]},"DOI":"10.1145\/3474085.3475521","type":"proceedings-article","created":{"date-parts":[[2021,10,18]],"date-time":"2021-10-18T06:21:10Z","timestamp":1634538070000},"page":"318-326","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["MeronymNet"],"prefix":"10.1145","author":[{"given":"Rishabh","family":"Baghel","sequence":"first","affiliation":[{"name":"International Institute of Information Technology, Hyderabad, Hyderabad, India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Abhishek","family":"Trivedi","sequence":"additional","affiliation":[{"name":"International Institute of Information Technology, Hyderabad, Hyderabad, India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Tejas","family":"Ravichandran","sequence":"additional","affiliation":[{"name":"International Institute of Information Technology, Hyderabad, Hyderabad, India"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Ravi Kiran","family":"Sarvadevabhatla","sequence":"additional","affiliation":[{"name":"International Institute of Information Technology, Hyderabad, Hyderabad, India"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2021,10,17]]},"reference":[{"volume-title":"Semantic Bottleneck Scene Generation. ArXiv","year":"2019","author":"Azadi Samaneh","key":"e_1_3_2_1_1_1"},{"volume-title":"A generative model of worldwide facial appearance","author":"Bessinger Zachary","key":"e_1_3_2_1_2_1","doi-asserted-by":"crossref","DOI":"10.1109\/WACV.2019.00172"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2018.10.009"},{"volume-title":"Large Scale GAN Training for High Fidelity Natural Image Synthesis. In International Conference on Learning Representations.","year":"2018","author":"Brock Andrew","key":"e_1_3_2_1_4_1"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/CoG47356.2020.9231807"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.254"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58571-6_10"},{"volume-title":"Tutorial on variational autoencoders. arXiv preprint arXiv:1606.05908","year":"2016","author":"Doersch Carl","key":"e_1_3_2_1_8_1"},{"volume-title":"Proceedings of the IEEE International Conference on Computer Vision Workshops. 0--0.","year":"2019","author":"Dornadula Apoorva","key":"e_1_3_2_1_9_1"},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"crossref","unstructured":"Hao Fu Chunyuan Li Xiaodong Liu Jianfeng Gao Asli Celikyilmaz and Lawrence Carin. 2019. Cyclical Annealing Schedule: A Simple Approach to Mitigating KL Vanishing. In NAACL. 240--250.  Hao Fu Chunyuan Li Xiaodong Liu Jianfeng Gao Asli Celikyilmaz and Lawrence Carin. 2019. Cyclical Annealing Schedule: A Simple Approach to Mitigating KL Vanishing. In NAACL. 240--250.","DOI":"10.18653\/v1\/N19-1021"},{"key":"e_1_3_2_1_11_1","unstructured":"Jiuxiang Gu Handong Zhao Zhe Lin Sheng Li Jianfei Cai and Mingyang Ling. 2019. Scene graph generation with external knowledge and image reconstruction. In CVPR. 1969--1978.  Jiuxiang Gu Handong Zhao Zhe Lin Sheng Li Jianfei Cai and Mingyang Ling. 2019. Scene graph generation with external knowledge and image reconstruction. In CVPR. 1969--1978."},{"volume-title":"Attgan: Facial attribute editing by only changing what you want","year":"2019","author":"He Zhenliang","key":"e_1_3_2_1_12_1"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.5555\/3295222.3295408"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"crossref","unstructured":"Seunghoon Hong Dingdong Yang Jongwook Choi and Honglak Lee. 2018. Inferring semantic layout for hierarchical text-to-image synthesis. In CVPR. 7986--7994.  Seunghoon Hong Dingdong Yang Jongwook Choi and Honglak Lee. 2018. Inferring semantic layout for hierarchical text-to-image synthesis. In CVPR. 7986--7994.","DOI":"10.1109\/CVPR.2018.00833"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"crossref","unstructured":"Phillip Isola Jun-Yan Zhu Tinghui Zhou and Alexei A Efros. 2017. Image-to-image translation with conditional adversarial networks. In CVPR. 1125--1134.  Phillip Isola Jun-Yan Zhu Tinghui Zhou and Alexei A Efros. 2017. Image-to-image translation with conditional adversarial networks. In CVPR. 1125--1134.","DOI":"10.1109\/CVPR.2017.632"},{"key":"e_1_3_2_1_16_1","doi-asserted-by":"crossref","unstructured":"Akash Abdu Jyothi Thibaut Durand Jiawei He Leonid Sigal and Greg Mori. 2019. LayoutVAE: Stochastic Scene Layout Generation From a Label Set. In ICCV.  Akash Abdu Jyothi Thibaut Durand Jiawei He Leonid Sigal and Greg Mori. 2019. LayoutVAE: Stochastic Scene Layout Generation From a Label Set. In ICCV.","DOI":"10.1109\/ICCV.2019.00999"},{"volume-title":"Adam: A method for stochastic optimization. arXiv preprint arXiv:1412.6980","year":"2014","author":"Kingma Diederik P","key":"e_1_3_2_1_17_1"},{"volume-title":"Auto-encoding variational bayes. ICLR","year":"2014","author":"Kingma Diederik P","key":"e_1_3_2_1_18_1"},{"volume-title":"Variational graph auto-encoders. arXiv preprint arXiv:1611.07308","year":"2016","author":"Kipf Thomas N","key":"e_1_3_2_1_19_1"},{"volume-title":"Kipf and Max Welling","year":"2017","author":"Thomas","key":"e_1_3_2_1_20_1"},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1145\/3072959.3073637"},{"volume-title":"LayoutGAN: Generating Graphic Layouts with Wireframe Discriminators. ICLR","year":"2019","author":"Li Jianan","key":"e_1_3_2_1_22_1"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.5555\/3327757.3327877"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/3355089.3356527"},{"key":"e_1_3_2_1_25_1","unstructured":"Kaichun Mo Shilin Zhu Angel X. Chang Li Yi Subarna Tripathi Leonidas J. Guibas and Hao Su. 2019 b. PartNet: A Large-Scale Benchmark for Fine-Grained and Hierarchical Part-Level 3D Object Understanding. In CVPR.  Kaichun Mo Shilin Zhu Angel X. Chang Li Yi Subarna Tripathi Leonidas J. Guibas and Hao Su. 2019 b. PartNet: A Large-Scale Benchmark for Fine-Grained and Hierarchical Part-Level 3D Object Understanding. In CVPR."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1111\/cgf.13240"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.5555\/3305890.3305954"},{"key":"e_1_3_2_1_28_1","unstructured":"Hyojin Park Youngjoon Yoo and Nojun Kwak. 2018. MC-GAN: Multi-conditional Generative Adversarial Network for Image Synthesis. In BMVC.  Hyojin Park Youngjoon Yoo and Nojun Kwak. 2018. MC-GAN: Multi-conditional Generative Adversarial Network for Image Synthesis. In BMVC."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"crossref","unstructured":"Taesung Park Ming-Yu Liu Ting-Chun Wang and Jun-Yan Zhu. 2019. Semantic Image Synthesis with Spatially-Adaptive Normalization. In CVPR.  Taesung Park Ming-Yu Liu Ting-Chun Wang and Jun-Yan Zhu. 2019. Semantic Image Synthesis with Spatially-Adaptive Normalization. In CVPR.","DOI":"10.1109\/CVPR.2019.00244"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"crossref","unstructured":"Daniel Ritchie Kai Wang and Yu-an Lin. 2019. Fast and flexible indoor scene synthesis via deep convolutional generative models. In CVPR. 6182--6190.  Daniel Ritchie Kai Wang and Yu-an Lin. 2019. Fast and flexible indoor scene synthesis via deep convolutional generative models. In CVPR. 6182--6190.","DOI":"10.1109\/CVPR.2019.00634"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.5555\/2969442.2969628"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.01063"},{"volume-title":"Feastnet: Feature-steered graph convolutions for 3d shape analysis. In CVPR. 2598--2606.","year":"2018","author":"Verma Nitika","key":"e_1_3_2_1_33_1"},{"key":"e_1_3_2_1_34_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.00091"},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3306346.3322956"},{"volume-title":"Attribute2image: Conditional image generation from visual attributes","author":"Yan Xinchen","key":"e_1_3_2_1_36_1"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.5555\/3454287.3454407"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"crossref","unstructured":"Jianwei Yang Jiasen Lu Stefan Lee Dhruv Batra and Devi Parikh. 2018. Graph R-CNN for scene graph generation. In ECCV. 670--685.  Jianwei Yang Jiasen Lu Stefan Lee Dhruv Batra and Devi Parikh. 2018. Graph R-CNN for scene graph generation. In ECCV. 670--685.","DOI":"10.1007\/978-3-030-01246-5_41"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"crossref","unstructured":"Xu Yang Kaihua Tang Hanwang Zhang and Jianfei Cai. 2019 a. Auto-encoding scene graphs for image captioning. In CVPR. 10685--10694.  Xu Yang Kaihua Tang Hanwang Zhang and Jianfei Cai. 2019 a. Auto-encoding scene graphs for image captioning. In CVPR. 10685--10694.","DOI":"10.1109\/CVPR.2019.01094"},{"key":"e_1_3_2_1_40_1","unstructured":"Guojun Yin Bin Liu Lu Sheng Nenghai Yu Xiaogang Wang and Jing Shao. 2019. Semantics Disentangling for Text-to-Image Generation. In CVPR. 2327--2336.  Guojun Yin Bin Liu Lu Sheng Nenghai Yu Xiaogang Wang and Jing Shao. 2019. Semantics Disentangling for Text-to-Image Generation. In CVPR. 2327--2336."},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1145\/2964284.2967274"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2018.2856256"},{"volume-title":"Dual Graph Convolutional Network for Semantic Segmentation. BMVC","year":"2019","author":"Zhang Li","key":"e_1_3_2_1_43_1"},{"volume-title":"Graph Node-Feature Convolution for Representation Learning. arXiv preprint arXiv:1812.00086","year":"2018","author":"Zhang Li","key":"e_1_3_2_1_44_1"},{"key":"e_1_3_2_1_45_1","doi-asserted-by":"crossref","unstructured":"Bo Zhao Lili Meng Weidong Yin and Leonid Sigal. 2019 a. Image Generation from Layout. In CVPR.  Bo Zhao Lili Meng Weidong Yin and Leonid Sigal. 2019 a. Image Generation from Layout. In CVPR.","DOI":"10.1109\/CVPR.2019.00878"},{"key":"e_1_3_2_1_46_1","doi-asserted-by":"crossref","unstructured":"Long Zhao Xi Peng Yu Tian Mubbasir Kapadia and Dimitris N Metaxas. 2019 b. Semantic Graph Convolutional Networks for 3D Human Pose Regression. In CVPR. 3425--3435.  Long Zhao Xi Peng Yu Tian Mubbasir Kapadia and Dimitris N Metaxas. 2019 b. Semantic Graph Convolutional Networks for 3D Human Pose Regression. In CVPR. 3425--3435.","DOI":"10.1109\/CVPR.2019.00354"}],"event":{"name":"MM '21: ACM Multimedia Conference","sponsor":["SIGMM ACM Special Interest Group on Multimedia"],"location":"Virtual Event China","acronym":"MM '21"},"container-title":["Proceedings of the 29th ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3474085.3475521","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3474085.3475521","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,17]],"date-time":"2025-06-17T20:49:10Z","timestamp":1750193350000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3474085.3475521"}},"subtitle":["A Hierarchical Model for Unified and Controllable Multi-Category Object Generation"],"short-title":[],"issued":{"date-parts":[[2021,10,17]]},"references-count":46,"alternative-id":["10.1145\/3474085.3475521","10.1145\/3474085"],"URL":"https:\/\/doi.org\/10.1145\/3474085.3475521","relation":{},"subject":[],"published":{"date-parts":[[2021,10,17]]},"assertion":[{"value":"2021-10-17","order":2,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}