{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,1]],"date-time":"2026-04-01T09:48:07Z","timestamp":1775036887641,"version":"3.50.1"},"reference-count":57,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2024,1,1]],"date-time":"2024-01-01T00:00:00Z","timestamp":1704067200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc-nd\/4.0\/"}],"funder":[{"name":"industry grant through RMIT","award":["PRJ00000694"],"award-info":[{"award-number":["PRJ00000694"]}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2024]]},"DOI":"10.1109\/access.2024.3506563","type":"journal-article","created":{"date-parts":[[2024,11,27]],"date-time":"2024-11-27T19:41:56Z","timestamp":1732736516000},"page":"179464-179477","source":"Crossref","is-referenced-by-count":8,"title":["GroundingCarDD: Text-Guided Multimodal Phrase Grounding for Car Damage Detection"],"prefix":"10.1109","volume":"12","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-8430-9416","authenticated-orcid":false,"given":"Md Jahid","family":"Hasan","sequence":"first","affiliation":[{"name":"RMIT Enterprise AI and Data Analytics Hub, RMIT University, Melbourne, VIC, Australia"}]},{"given":"Agustinus","family":"Nalwan","sequence":"additional","affiliation":[{"name":"carsales, Richmond, VIC, Australia"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4688-7674","authenticated-orcid":false,"given":"Kok-Leong","family":"Ong","sequence":"additional","affiliation":[{"name":"RMIT Enterprise AI and Data Analytics Hub, RMIT University, Melbourne, VIC, Australia"}]},{"given":"Hamed","family":"Jahani","sequence":"additional","affiliation":[{"name":"RMIT Enterprise AI and Data Analytics Hub, RMIT University, Melbourne, VIC, Australia"}]},{"given":"Yee Ling","family":"Boo","sequence":"additional","affiliation":[{"name":"RMIT Enterprise AI and Data Analytics Hub, RMIT University, Melbourne, VIC, Australia"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2760-8724","authenticated-orcid":false,"given":"Kha Cong","family":"Nguyen","sequence":"additional","affiliation":[{"name":"RMIT Enterprise AI and Data Analytics Hub, RMIT University, Melbourne, VIC, Australia"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4302-8516","authenticated-orcid":false,"given":"Mahmudul","family":"Hasan","sequence":"additional","affiliation":[{"name":"School of Information Technology, Deakin University, Geelong, VIC, Australia"}]}],"member":"263","reference":[{"key":"ref1","volume-title":"Motor Vehicle Census, Australia, 31, Jan. 2021 |Australian Bureau of Statistics","year":"2021"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1108\/JFRC-11-2021-0102"},{"key":"ref3","article-title":"Second hand vehicle maintenance frauds","volume-title":"22nd JUMV Int. Automot. Conf","author":"Duboka"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-16-3153-5_31"},{"key":"ref5","volume-title":"One in Four Are Buying Cars Online but Dealerships Will Remain Vital for Move to Evs\u2014Ey Mobility Consumer Index |Ey Australia","year":"2024"},{"key":"ref6","volume-title":"Carsales.Com.Au","year":"2023"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1155\/2022\/5004129"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1117\/12.2558395"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2964055"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CCECE47787.2020.9255806"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1145\/3406601.3406651"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICCIKE58312.2023.10131804"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.37936\/ecti-cit.2021153.223151"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/3589845.3589848"},{"key":"ref15","volume-title":"Detectron2","author":"Wu","year":"2019"},{"key":"ref16","first-page":"1","article-title":"Faster r-CNN: Towards real-time object detection with region proposal networks","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"28","author":"Ren"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58452-8_13"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.91"},{"key":"ref19","article-title":"SAM2: Segment anything in images and videos","author":"Ravi","year":"2024","journal-title":"arXiv:2408.00714"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/NITC.2017.8285649"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/ICCES57224.2023.10192858"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-85365-5_14"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICCSEA54677.2022.9936208"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICMLA.2017.0-179"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/ICOEI51242.2021.9452846"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1093\/jcde\/qwad063"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-23756-1_39"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/ICE3IS59323.2023.10335254"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/ICE3IS59323.2023.10335327"},{"key":"ref30","first-page":"28","article-title":"Mars: Mask attention refinement with sequential quadtree nodes for car damage instance segmentation","volume-title":"Proc. Int. Conf. Image Anal. Process","author":"Panboonyuen"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/3609703.3609709"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/TITS.2023.3258480"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/KSE59128.2023.10299490"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/DeSE58274.2023.10100274"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-15-7062-9_61"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1088\/1742-6596\/1880\/1\/012024"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-15-8697-2_14"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1007\/s41315-022-00231-5"},{"key":"ref39","volume-title":"Labelme: Image Polygonal Annotation With Python (polygon, Rectangle, Circle, Line, Point and Image-level Flag Annotation)","year":"2024"},{"key":"ref40","article-title":"MiniGPT-4: Enhancing vision-language understanding with advanced large language models","author":"Zhu","year":"2023","journal-title":"arXiv:2304.10592"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46448-0_2"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref43","article-title":"Deformable DETR: Deformable transformers for end-to-end object detection","author":"Zhu","year":"2020","journal-title":"arXiv:2010.04159"},{"key":"ref44","article-title":"BERT: Pre-training of deep bidirectional transformers for language understanding","author":"Devlin","year":"2018","journal-title":"arXiv:1810.04805"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01069"},{"key":"ref46","article-title":"GRILL: Grounded vision-language pre-training via aligning text and image regions","author":"Jin","year":"2023","journal-title":"arXiv:2305.14676"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58577-8_8"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02156"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20077-9_7"},{"key":"ref50","article-title":"Grounding DINO: Marrying DINO with grounded pre-training for open-set object detection","author":"Liu","year":"2023","journal-title":"arXiv:2303.05499"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"ref52","article-title":"Decoupled weight decay regularization","author":"Loshchilov","year":"2017","journal-title":"arXiv:1711.05101"},{"key":"ref53","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"ref54","doi-asserted-by":"publisher","DOI":"10.1109\/TCYB.2021.3095305"},{"key":"ref55","volume-title":"Coco\u2014Common Objects in Context","year":"2024"},{"key":"ref56","doi-asserted-by":"publisher","DOI":"10.1007\/s11042-024-18872-y"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-72751-1_1"}],"container-title":["IEEE Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/6287639\/10380310\/10767696.pdf?arnumber=10767696","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,12,11]],"date-time":"2024-12-11T02:22:47Z","timestamp":1733883767000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10767696\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024]]},"references-count":57,"URL":"https:\/\/doi.org\/10.1109\/access.2024.3506563","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2024]]}}}