@inproceedings{e4e75fc7f9524dd3ab5d7af61366c831,
title = "FFT-based Appearance Adaptation for the Semantic Segmentation of Small-scale Aerial Image Datasets",
abstract = "Modern semantic segmentation models, which enable useful applications based on aerial image analysis such as tracking deforestation of the Amazon rainforest over time, rely on access to large amounts of training data. However, due to the cost of manually labeling data, segmentation datasets, including aerial image datasets, are often relatively small. In many cases, no labels are available at all and domain adaptation from a related domain has to be performed. Since many domain adaptation approaches are specialized for the adaptation of street scene segmentation, we propose an alternate domain adaptation pipeline taking the properties of aerial image datasets into account. We propose a novel appearance adaptation technique using statistics (mean and covariance) of coefficients in the frequency domain and transferring the statistics from one domain to another to copy its look/style. In an experiment with 30 domain pairs, we achieved an average improvement of 2.5% mean F1 score. We improve upon the state of the art by 13.3%.",
keywords = "Aerial Images, Appearance Adaptation, Domain Adaptation, Semantic Segmentation",
author = "Daniel Gritzner and Sven Ysker and J{\"o}rn Ostermann",
note = "Publisher Copyright: {\textcopyright} 2026 SPIE.; 18th International Conference on Machine Vision, ICMV 2025, ICMV 2025 ; Conference date: 19-10-2025 Through 22-10-2025",
year = "2026",
month = feb,
day = "25",
doi = "10.1117/12.3093986",
language = "English",
series = "Proceedings of SPIE - The International Society for Optical Engineering",
publisher = "SPIE",
editor = "Wolfgang Osten",
booktitle = "Eighteenth International Conference on Machine Vision, ICMV 2025",
address = "United States",
}