@inproceedings{7c36d28282b341f09c2972cef0a1072c,
title = "PanFormer: A Transformer Based Model for Pan-Sharpening",
abstract = "Pan-sharpening aims at producing a high-resolution (HR) multi-spectral (MS) image from a low-resolution (LR) multi-spectral (MS) image and its corresponding panchromatic (PAN) image acquired by a same satellite. Inspired by a new fashion in recent deep learning community, we propose a novel Transformer based model for pan-sharpening. We explore the potential of Transformer in image feature extraction and fusion. Following the successful development of vision transformers, we design a two-stream network with the self-attention to extract the modality-specific features from the PAN and MS modalities and apply a cross-attention module to merge the spectral and spatial features. The pan-sharpened image is produced from the enhanced fused features. Extensive experiments on GaoFen-2 and WorldView-3 images demonstrate that our Transformer based model achieves impressive results and outperforms many existing CNN based methods, which shows the great potential of introducing Transformer to the pan-sharpening task. Codes are available at https://github.com/zhysora/PanFormer.",
keywords = "Pan-sharpening, attention mechanism, remote sensing, transformer",
author = "Huanyu Zhou and Qingjie Liu and Yunhong Wang",
note = "Publisher Copyright: {\textcopyright} 2022 IEEE.; 2022 IEEE International Conference on Multimedia and Expo, ICME 2022 ; Conference date: 18-07-2022 Through 22-07-2022",
year = "2022",
doi = "10.1109/ICME52920.2022.9859770",
language = "英语",
series = "Proceedings - IEEE International Conference on Multimedia and Expo",
publisher = "IEEE Computer Society",
booktitle = "ICME 2022 - IEEE International Conference on Multimedia and Expo 2022, Proceedings",
address = "美国",
}