% Conference paper in the IWBIS 2021 proceedings (pages 41--46).
% - title: acronyms are braced so sentence-casing styles keep their capitals.
% - booktitle: carries the full proceedings title.
% - note: holds only the publisher copyright and the conference event details.
% - address: publisher country as exported; the publisher's city is not recorded here (TODO confirm).
@inproceedings{9c68e4b22ab740c2875f5409d91160be,
author = "Shaniya, Putri and Jati, Grafika and Alhamidi, Machmud Roby and Caesarendra, Wahyu and Jatmiko, Wisnu",
title = "{YOLOv4} {RGBT} Human Detection on Unmanned Aerial Vehicle Perspective",
booktitle = "Proceedings - {IWBIS} 2021: 6th International Workshop on Big Data and Information Security",
pages = "41--46",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
address = "United States",
year = "2021",
doi = "10.1109/IWBIS53353.2021.9631856",
language = "English",
keywords = "Human detection, RGBT, small object, UAV, YOLO",
abstract = "Analysis of visual drone images in various domains is increasing due to its ability to see the object from different perspectives and certain distant. Nowadays, small object detection from drones images is expected to overcome various environmental challenges such as illumination and motion change. Thermal infrared in addition to RGB images (RGBT) appears to undertake these challenges. Research on how this combination can give the best performance in object detection is still become attractive problem to be solved. In this study, The state of the art in object detection You Only Look Once (YOLO) v4 performance has been demonstrated by conducted three scenarios training methods in both RGB and thermal infrared (TIR) images dataset with unmanned aerial vehicle (UAV) perspective view. The dataset has been manually annotated to be compatible in YOLO format and the annotation will be release to the community. The pre-trained YOLO weight with minimal fine tuning also has been utilized to determine the transfer learning influence on the new aerial perspective dataset. The experimental result shows that with pre-trained model transfer learning from MS COCO dataset can improved the YOLOv4 human detection with Average Precision (AP) up to 91.18 % and 78.24 % in RGB and TIR dataset, respectively. ",
note = "Publisher Copyright: {\textcopyright} 2021 IEEE.; 6th International Workshop on Big Data and Information Security, IWBIS 2021 ; Conference date: 23-10-2021 Through 26-10-2021",
}