{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T22:37:21Z","timestamp":1761172641676,"version":"build-2065373602"},"reference-count":25,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T00:00:00Z","timestamp":1757376000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,9,9]],"date-time":"2025-09-09T00:00:00Z","timestamp":1757376000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,9,9]]},"DOI":"10.1109\/etfa65518.2025.11205775","type":"proceedings-article","created":{"date-parts":[[2025,10,21]],"date-time":"2025-10-21T17:07:47Z","timestamp":1761066467000},"page":"1-8","source":"Crossref","is-referenced-by-count":0,"title":["Applying Vision Transformers and Large Language Models to Anomaly Detection for Safer UAV Landings"],"prefix":"10.1109","author":[{"given":"Mohammad Reza Ranjbar","family":"Divkoti","sequence":"first","affiliation":[{"name":"University of Porto,SYSTEC-ARISE Research Center for Systems and Technologies, Faculty of Engineering,Porto,Portugal,4200-465"}]},{"given":"A. Pedro","family":"Aguiar","sequence":"additional","affiliation":[{"name":"University of Porto,SYSTEC-ARISE Research Center for Systems and Technologies, Faculty of Engineering,Porto,Portugal,4200-465"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1016\/j.engappai.2024.107961"},{"key":"ref2","first-page":"1","article-title":"An exploratory investigation of log anomalies in unmanned aerial vehicles","volume-title":"Proceedings of the IEEE\/ACM 46th International Conference on Software Engineering","author":"Wang"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/TCYB.2022.3213526"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1007\/s00500-025-10481-7"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/TIM.2024.3428649"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1007\/s10115-015-0845-4"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA.2019.8794286"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ISCC50000.2020.9219585"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.15607\/RSS.2024.XX.114"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.findings-naacl.333"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-73004-7_18"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1007\/s10514-023-10132-6"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20080-9_42"},{"article-title":"Video anomaly detection and explanation via large language models","year":"2024","author":"Lv","key":"ref14"},{"article-title":"Holmes-vad: Towards unbiased and explainable video anomaly detection via multi-modal llm","year":"2024","author":"Zhang","key":"ref15"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ICNS60906.2024.10550825"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TR.2021.3134369"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICRA40945.2020.9197074"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/n19\u20131423"},{"article-title":"An image is worth 16x16 words: Transformers for image recognition at scale","year":"2020","author":"Dosovitskiy","key":"ref21"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01553"},{"key":"ref23","first-page":"249","article-title":"Understanding the difficulty of training deep feedforward neural networks","volume-title":"Proceedings of the thirteenth international conference on artificial intelligence and statistics","author":"Glorot"},{"article-title":"Decoupled weight decay regularization","year":"2017","author":"Loshchilov","key":"ref24"},{"article-title":"Mammut: A simple architecture for joint learning for multimodal tasks","year":"2023","author":"Kuo","key":"ref25"}],"event":{"name":"2025 IEEE 30th International Conference on Emerging Technologies and Factory Automation (ETFA)","start":{"date-parts":[[2025,9,9]]},"location":"Porto, Portugal","end":{"date-parts":[[2025,9,12]]}},"container-title":["2025 IEEE 30th International Conference on Emerging Technologies and Factory Automation (ETFA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11205475\/11205526\/11205775.pdf?arnumber=11205775","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T05:21:42Z","timestamp":1761110502000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11205775\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,9,9]]},"references-count":25,"URL":"https:\/\/doi.org\/10.1109\/etfa65518.2025.11205775","relation":{},"subject":[],"published":{"date-parts":[[2025,9,9]]}}}