% Conference paper from the ICCCS 2022 proceedings (series: Communications in
% Computer and Information Science). Acronyms in the title are brace-protected
% so sentence-casing styles keep their capitalisation; the DOI is stored bare
% (no LaTeX escaping) so URL-aware styles can build a working link.
@inproceedings{45693cde21b54d8db5c8bcb3f0024c10,
  author    = {Zhang, Guowei and Chen, Xingyu and Tan, Xun and Zhang, Jiahao and Lan, Xuguang},
  title     = {{U-YOLO}: Improved {YOLOv5} for Small Object Detection on {UAV}-Captured Images},
  booktitle = {Cognitive Computation and Systems - First International Conference, ICCCS 2022, Revised Selected Papers},
  editor    = {Sun, Fuchun and Li, Jianmin and Liu, Huaping and Chu, Zhongyi},
  series    = {Communications in Computer and Information Science},
  publisher = {Springer Science and Business Media Deutschland GmbH},
  year      = {2023},
  pages     = {3--15},
  doi       = {10.1007/978-981-99-2789-0_1},
  isbn      = {9789819927883},
  language  = {English},
  keywords  = {Object detection, Small object detection, Unmanned aerial vehicle, Visual attention},
  abstract  = {Small object detection on drone-captured images is a recently popular and challenging task. From the drone{\textquoteright}s perspective, the object scale varies significantly, and tiny objects lack distinguishable appearance information in complex backgrounds, which leads to undesired effects. To solve the issue mentioned above, we propose U-YOLO based on the original YOLOv5 model. We first extend the multi-scale feature fusion network and add a detection head for tiny objects. Secondly, we integrate the convolutional block attention model (CBAM) in the detection head to focus on the critical region of the feature map. Lastly, an attention feature fusion module based on contextual information is designed to combine local and global contextual details of small objects and attention mechanisms to enhance the multi-scale feature fusion capability. Experiments on dataset VisDrone2021-DET show that U-YOLO not only improves the detection performance on drone-captured scenarios but also has a real-time detection speed. Compared to baseline model (YOLOv5s), the mAP result of U-YOLO is increased from 19.07 to 24.1\%, and the detection speed is 39FPS. It provides a good balance between detection accuracy and speed, promoting the progress of small object detection algorithms on UAV platforms.},
  note      = {Publisher Copyright: {\textcopyright} 2023, The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd.; 1st International Conference on Cognitive Computation and Systems, ICCCS 2022 ; Conference date: 17-12-2022 Through 18-12-2022},
}