@inproceedings{c7678508047e4969bf01807c8273dfb1,
title = "SIAM-WFEF: Small target tracking network based on wavelet pooling layer and frequency band enhancement and fusion",
abstract = "Unmanned aerial vehicles (UAVs) are increasingly used for target tracking, but long-distance/high-altitude imaging often yields tiny, blurred targets with few pixels. Conventional feature extraction struggles to capture local details and discriminative cues, making targets vulnerable to background interference and reducing tracking accuracy. This paper proposes Siam-WFEF, a Siamese network-based tracker featuring two synergistic modules: Wavelet Pooling Layer (WPL) and Frequency Band Enhancement and Fusion (FBEF). WPL replaces traditional pooling by applying the Discrete Wavelet Transform to decompose feature maps into low- and high-frequency sub-bands, preserving critical details of small targets. FBEF then refines each sub-band and adaptively fuses the enhanced frequency features, jointly suppressing background clutter while amplifying target cues. Extensive experiments on UAV123, DTB70, and VisDrone2019-SOT demonstrate that Siam-WFEF achieves significant performance gains over mainstream trackers, particularly for small targets under challenging conditions.",
keywords = "Siamese network, UAV vision, frequency fusion, small target tracking, wavelet pooling",
author = "Yaomiao Meng and Yuqi Han and Linbo Tang and Qiuyu Jin and Sharan Thapa",
note = "Publisher Copyright: {\textcopyright} 2026 SPIE.; International Conference on Machine Learning and Artificial Intelligence Applications, MLAIA 2025 ; Conference date: 12-12-2025 Through 14-12-2025",
year = "2026",
month = mar,
day = "9",
doi = "10.1117/12.3110411",
language = "English",
series = "Proceedings of SPIE - The International Society for Optical Engineering",
publisher = "SPIE",
editor = "Jianhua Zhou",
booktitle = "International Conference on Machine Learning and Artificial Intelligence Applications, MLAIA 2025",
address = "United States",
}