% Conference-paper record for the Diffusion-Geo paper (IGARSS 2024 proceedings).
% Braces inside title/booktitle/series protect the model name and acronyms from
% being lower-cased by bibliography styles that apply sentence casing.
% NOTE(review): address holds a country rather than a publisher city - confirm
%   the intended value before relying on it in styles that print the address.
% NOTE(review): the abstract reads "downtown task", which looks like a typo for
%   "downstream task"; left verbatim pending a check against the published text.
@inproceedings{010ac9b72f92489581814b8d4b8a1e61,
title = "{Diffusion-Geo}: A Two-Stage Controllable Text-To-Image Generative Model for Remote Sensing Scenarios",
abstract = "Image generation is a crucial task to facilitate intelligent interpretation in remote sensing domain. Expanding dataset size through image generation can enhance model performance of downtown task. However, current generative models in remote sensing are mostly unconditional or guided by simple text, resulting in generated images lacking spatial and semantic constraints. This lack of control can negatively optimize downstream task models. To tackle these challenges, a two-stage controllable text-image generative model called Diffusion-Geo is presented. In the first stage, an extensive image-text generation dataset called RS-Control is created through prompt engineering of multimodal large language models (MLLMs) and manual prompts for existing datasets, incorporates diverse conditional controls with rich spatial and semantic information. Then RS-Control dataset is utilized to train a universal controllable image generative model. The second stage involves efficient tuning the universal model for different task datasets, minimizing fine-tuning costs while preserving diversity and high-quality features. Experiments conducted on the RSICD caption dataset and WHU change detection dataset demonstrate the superiority of Diffusion-Geo over other state-of-the-art models in image generation.",
keywords = "controllable text-to-image generation, diffusion, remote sensing",
author = "Miaoxin Cai and Wei Zhang and Tong Zhang and Yin Zhuang and He Chen and Liang Chen and Can Li",
note = "Publisher Copyright: {\textcopyright} 2024 IEEE.; 2024 IEEE International Geoscience and Remote Sensing Symposium, IGARSS 2024 ; Conference date: 07-07-2024 Through 12-07-2024",
year = "2024",
doi = "10.1109/IGARSS53475.2024.10641523",
language = "English",
series = "International Geoscience and Remote Sensing Symposium ({IGARSS})",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "7003--7006",
booktitle = "{IGARSS} 2024 - 2024 {IEEE} International Geoscience and Remote Sensing Symposium, Proceedings",
address = "United States",
}