{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,6]],"date-time":"2026-05-06T15:21:04Z","timestamp":1778080864502,"version":"3.51.4"},"reference-count":77,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"3","license":[{"start":{"date-parts":[[2021,3,1]],"date-time":"2021-03-01T00:00:00Z","timestamp":1614556800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,3,1]],"date-time":"2021-03-01T00:00:00Z","timestamp":1614556800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,3,1]],"date-time":"2021-03-01T00:00:00Z","timestamp":1614556800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61772359"],"award-info":[{"award-number":["61772359"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61872267"],"award-info":[{"award-number":["61872267"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["61902277"],"award-info":[{"award-number":["61902277"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"grant of Tianjin New Generation Artificial Intelligence Major Program","award":["19ZXZNGX00110"],"award-info":[{"award-number":["19ZXZNGX00110"]}]},{"name":"grant of Tianjin New Generation Artificial Intelligence Major Program","award":["18ZXZNGX00150"],"award-info":[{"award-number":["18ZXZNGX00150"]}]},{"DOI":"10.13039\/501100004835","name":"Open Project Program of the State Key Lab of CAD and CG, Zhejiang University","doi-asserted-by":"publisher","award":["A2005"],"award-info":[{"award-number":["A2005"]}],"id":[{"id":"10.13039\/501100004835","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100004835","name":"Open Project Program of the State Key Lab of CAD and CG, Zhejiang University","doi-asserted-by":"publisher","award":["A2012"],"award-info":[{"award-number":["A2012"]}],"id":[{"id":"10.13039\/501100004835","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Circuits Syst. Video Technol."],"published-print":{"date-parts":[[2021,3]]},"DOI":"10.1109\/tcsvt.2020.2990989","type":"journal-article","created":{"date-parts":[[2020,4,28]],"date-time":"2020-04-28T20:29:36Z","timestamp":1588105776000},"page":"1031-1041","source":"Crossref","is-referenced-by-count":25,"title":["Scene Graph Inference via Multi-Scale Context Modeling"],"prefix":"10.1109","volume":"31","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-7526-4356","authenticated-orcid":false,"given":"Ning","family":"Xu","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5755-9145","authenticated-orcid":false,"given":"An-An","family":"Liu","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1239-4428","authenticated-orcid":false,"given":"Yongkang","family":"Wong","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-0578-8138","authenticated-orcid":false,"given":"Weizhi","family":"Nie","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5165-204X","authenticated-orcid":false,"given":"Yuting","family":"Su","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4846-2015","authenticated-orcid":false,"given":"Mohan","family":"Kankanhalli","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2017.2771332"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.454"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.331"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2018.2817340"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.71"},{"key":"ref77","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2013.211"},{"key":"ref74","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2018.2797248"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00725"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.651"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1145\/3123266.3123436"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.142"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01246-5_21"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.766"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.289"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2018\/114"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2537337"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2018.2810191"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2017.2708714"},{"key":"ref60","first-page":"690","article-title":"Graph R-CNN for scene graph generation","volume":"11205","author":"yang","year":"2018","journal-title":"Proc ECCV"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01258-8_3"},{"key":"ref61","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01094"},{"key":"ref63","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2010.5540234"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995466"},{"key":"ref64","first-page":"702","article-title":"Describing the scene as a whole: Joint object detection, scene classification and semantic segmentation","author":"yao","year":"2012","journal-title":"Proc IEEE Conf Comput Vis Pattern Recognit"},{"key":"ref27","first-page":"1106","article-title":"ImageNet classification with deep convolutional neural networks","author":"krizhevsky","year":"2012","journal-title":"Proc NIPS"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1109\/TCYB.2020.2969046"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2019.2947482"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2018.2868854"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2019.2932058"},{"key":"ref68","doi-asserted-by":"publisher","DOI":"10.1109\/TNNLS.2019.2908982"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.121"},{"key":"ref2","article-title":"Learning to generalize to new compositions in image understanding","author":"atzmon","year":"2016","journal-title":"arXiv 1608 07639"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46454-1_24"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/TIE.2014.2378735"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/TII.2018.2884211"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2015.2487860"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298990"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.37"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-016-0981-7"},{"key":"ref25","first-page":"1889","article-title":"Deep fragment embeddings for bidirectional image sentence mapping","author":"karpathy","year":"2014","journal-title":"Proc NIPS"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00857"},{"key":"ref51","first-page":"1","article-title":"Very deep convolutional networks for large-scale image recognition","author":"simonyan","year":"2015","journal-title":"Proc ICLR"},{"key":"ref59","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2924576"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2903448"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2017.2720749"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2941820"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2018.2867286"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.330"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00212"},{"key":"ref52","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2019.2943753"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00626"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2010.02.004"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_51"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.169"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.81"},{"key":"ref14","first-page":"1080","article-title":"Contextual action recognition with $\\text{R}^{\\ast}$\nCNN","author":"gkioxari","year":"2015","journal-title":"Proc IEEE Int Conf Comput Vis (ICCV)"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-013-0658-4"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-540-88682-2_3"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1162\/neco.1997.9.8.1735"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00471"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2012.6248100"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2017.352"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2010.5540221"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00254"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2013.340"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2011.5995711"},{"key":"ref9","first-page":"1292","article-title":"Image description using visual dependency representations","author":"elliott","year":"2013","journal-title":"Proc EMNLP"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00408"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-016-0965-7"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2577031"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7298713"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2014.313"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/TCSVT.2017.2749980"},{"key":"ref44","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.213"},{"key":"ref43","first-page":"1","article-title":"Automatic differentiation in PyTorch","author":"paszke","year":"2017","journal-title":"Proc NIPS Autodiff Workshop"}],"container-title":["IEEE Transactions on Circuits and Systems for Video Technology"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/76\/9370015\/09079879.pdf?arnumber=9079879","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T14:50:28Z","timestamp":1652194228000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9079879\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,3]]},"references-count":77,"journal-issue":{"issue":"3"},"URL":"https:\/\/doi.org\/10.1109\/tcsvt.2020.2990989","relation":{},"ISSN":["1051-8215","1558-2205"],"issn-type":[{"value":"1051-8215","type":"print"},{"value":"1558-2205","type":"electronic"}],"subject":[],"published":{"date-parts":[[2021,3]]}}}