{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,15]],"date-time":"2025-11-15T07:24:05Z","timestamp":1763191445817,"version":"3.45.0"},"reference-count":30,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,6,30]],"date-time":"2025-06-30T00:00:00Z","timestamp":1751241600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,6,30]],"date-time":"2025-06-30T00:00:00Z","timestamp":1751241600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100012226","name":"Fundamental Research Funds for the Central Universities","doi-asserted-by":"publisher","id":[{"id":"10.13039\/501100012226","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,6,30]]},"DOI":"10.1109\/ijcnn64981.2025.11227744","type":"proceedings-article","created":{"date-parts":[[2025,11,14]],"date-time":"2025-11-14T18:46:15Z","timestamp":1763145975000},"page":"1-8","source":"Crossref","is-referenced-by-count":0,"title":["MSALNet: Capturing Contextual Relationships for Monocular 3D Visual Grounding"],"prefix":"10.1109","author":[{"given":"Keyu","family":"Guo","sequence":"first","affiliation":[{"name":"Chang&#x2019;an University,Xi&#x2019;an,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yongle","family":"Huang","sequence":"additional","affiliation":[{"name":"Chang&#x2019;an University,Xi&#x2019;an,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Yongfeng","family":"Bu","sequence":"additional","affiliation":[{"name":"Chang&#x2019;an University,Xi&#x2019;an,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Hongkai","family":"Wei","sequence":"additional","affiliation":[{"name":"Chang&#x2019;an University,Xi&#x2019;an,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Shijie","family":"Sun","sequence":"additional","affiliation":[{"name":"Chang&#x2019;an University,Xi&#x2019;an,China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiangyu","family":"Song","sequence":"additional","affiliation":[{"name":"Chang&#x2019;an University,Xi&#x2019;an,China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00808"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3548316"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TIM.2023.3324362"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-78462-1_15"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1134\/S1019331618010094"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.3390\/mti9010006"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2983149"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1016\/j.compeleceng.2025.110116"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1021\/acssensors.4c01202"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/jsen.2024.3360457"},{"key":"ref11","first-page":"02783649241230562","article-title":"A survey on socially aware robot navigation: Taxonomy and future challenges","author":"S","year":"2024","journal-title":"The International Journal of Robotics Research"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/RAIIC61787.2024.10671357"},{"key":"ref13","first-page":"1769","article-title":"Transvg: End-to-end visual grounding with transformers","volume-title":"Proceedings of the IEEE\/CVF International Conference on Computer Vision","author":"D"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2023.3321501"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i5.28278"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01506"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01843"},{"article-title":"A unified framework for 3d point cloud visual grounding","year":"2023","author":"L","key":"ref18"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01597"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i7.28525"},{"article-title":"Mamba: Linear-time sequence modeling with selective state spaces","year":"2023","author":"Gu","key":"ref21"},{"article-title":"Ml-mamba: Efficient multi-modal large language model utilizing mamba-2","year":"2024","author":"H","key":"ref22"},{"article-title":"Vl-mamba: Exploring state space models for multimodal learning","year":"2024","author":"Q","key":"ref23"},{"key":"ref24","first-page":"471","article-title":"A robustly optimized bert pre-training approach with post-training","volume-title":"China National Conference on Chinese Computational Linguistics","author":"L"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3152247"},{"article-title":"Improved baselines with momentum contrastive learning","year":"2020","author":"Chen","key":"ref26"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01264"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2019.00479"},{"key":"ref29","first-page":"4683","article-title":"A fast and accurate one-stage approach to visual grounding","volume-title":"Proceedings of the IEEE\/CVF international conference on computer vision","author":"Y"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58568-6_23"}],"event":{"name":"2025 International Joint Conference on Neural Networks (IJCNN)","start":{"date-parts":[[2025,6,30]]},"location":"Rome, Italy","end":{"date-parts":[[2025,7,5]]}},"container-title":["2025 International Joint Conference on Neural Networks (IJCNN)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11227166\/11227148\/11227744.pdf?arnumber=11227744","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,15]],"date-time":"2025-11-15T07:22:12Z","timestamp":1763191332000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11227744\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,6,30]]},"references-count":30,"URL":"https:\/\/doi.org\/10.1109\/ijcnn64981.2025.11227744","relation":{},"subject":[],"published":{"date-parts":[[2025,6,30]]}}}