{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,1]],"date-time":"2025-10-01T15:31:01Z","timestamp":1759332661687,"version":"3.28.0"},"reference-count":18,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,10,5]],"date-time":"2023-10-05T00:00:00Z","timestamp":1696464000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,10,5]],"date-time":"2023-10-05T00:00:00Z","timestamp":1696464000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,10,5]]},"DOI":"10.1109\/mapr59823.2023.10289072","type":"proceedings-article","created":{"date-parts":[[2023,10,26]],"date-time":"2023-10-26T13:50:46Z","timestamp":1698328246000},"page":"1-6","source":"Crossref","is-referenced-by-count":2,"title":["ViT-FFrCnt: A Few-shot Fruit Counting Approach with Multiscale Vision Transformer"],"prefix":"10.1109","author":[{"given":"Khanh-An C.","family":"Quan","sequence":"first","affiliation":[{"name":"University of Information Technology, VNU-HCM,Ho Chi Minh City,Vietnam"}]},{"given":"Huy Gia","family":"Vuong","sequence":"additional","affiliation":[{"name":"University of Science, VNU-HCM,Ho Chi Minh City,Vietnam"}]},{"given":"Minh-Triet","family":"Tran","sequence":"additional","affiliation":[{"name":"University of Science, VNU-HCM,Ho Chi Minh City,Vietnam"}]}],"member":"263","reference":[{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01196"},{"key":"ref15","article-title":"An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale","author":"dosovitskiy","year":"2021","journal-title":"9th International Conference on Learning Representations ICLR 2021"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2017.7989417"},{"key":"ref11","article-title":"Deformable DETR: Deformable Transformers for End-to-End Object Detection","author":"zhu","year":"2021","journal-title":"9th International Conference on Learning Representations ICLR 2021"},{"journal-title":"YOLOv5 by Ultralytics Version 7 0","year":"2020","author":"jocher","key":"ref10"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1016\/j.compag.2022.107000"},{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.3390\/s17040905"},{"key":"ref17","doi-asserted-by":"crossref","first-page":"248","DOI":"10.1109\/CVPR.2009.5206848","article-title":"Imagenet: A large-scale hierarchical image database","author":"deng","year":"2009","journal-title":"2009 IEEE Conference on Computer Vision and Pattern Recognition"},{"key":"ref16","article-title":"Unified Perceptual Parsing for Scene Understanding","author":"xiao","year":"2018","journal-title":"European Conference on Computer Vision"},{"key":"ref18","article-title":"Decoupled Weight Decay Regularization","author":"loshchilov","year":"2017","journal-title":"International Conference on Learning Representations"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.322"},{"key":"ref7","first-page":"91","article-title":"Faster R-CNN: Towards RealTime Object Detection with Region Proposal Networks","author":"ren","year":"2015","journal-title":"NIPS"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/s11704-021-1207-x"},{"key":"ref3","doi-asserted-by":"crossref","first-page":"107062","DOI":"10.1016\/j.compag.2022.107062","article-title":"Complete and accurate holly fruits counting using YOLOX object detection","volume":"198","author":"zhang","year":"2022","journal-title":"Computers and Electronics in Agriculture"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.3390\/s16081222"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1007\/s11432-021-3445-y"}],"event":{"name":"2023 International Conference on Multimedia Analysis and Pattern Recognition (MAPR)","start":{"date-parts":[[2023,10,5]]},"location":"Quy Nhon, Vietnam","end":{"date-parts":[[2023,10,6]]}},"container-title":["2023 International Conference on Multimedia Analysis and Pattern Recognition (MAPR)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10288584\/10288633\/10289072.pdf?arnumber=10289072","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,11,13]],"date-time":"2023-11-13T14:04:45Z","timestamp":1699884285000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10289072\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,5]]},"references-count":18,"URL":"https:\/\/doi.org\/10.1109\/mapr59823.2023.10289072","relation":{},"subject":[],"published":{"date-parts":[[2023,10,5]]}}}