@inproceedings{b1f79996fae24874b27227dbec1d7d4e,
title = "CIC-FL: Enabling Class Imbalance-Aware Clustered Federated Learning over Shifted Distributions",
abstract = "Federated learning (FL) is a distributed training framework where decentralized clients collaboratively train a model. One challenge in FL is concept shift, i.e. that the conditional distributions of data in different clients are disagreeing. A natural solution is to group clients with similar conditional distributions into the same cluster. However, methods following this approach leverage features extracted in federated settings (e.g., model weights or gradients) which intrinsically reflect the joint distributions of clients. Considering the difference between conditional and joint distributions, they would fail in the presence of class imbalance (i.e. that the marginal distributions of different classes vary in a client{\textquoteright}s data). Although adopting sampling techniques or cost-sensitive algorithms can alleviate class imbalance, they either skew the original conditional distributions or lead to privacy leakage. To address this challenge, we propose CIC-FL, a class imbalance-aware clustered federated learning method. CIC-FL iteratively bipartitions clients by leveraging a particular feature sensitive to concept shift but robust to class imbalance. In addition, CIC-FL is privacy-preserving and communication efficient. We test CIC-FL on benchmark datasets including Fashion-MNIST, CIFAR-10 and IMDB. The results show that CIC-FL outperforms state-of-the-art clustering methods in FL in the presence of class imbalance.",
keywords = "Class imbalance, Clustering, Concept shift, Federated learning",
author = "Yanan Fu and Xuefeng Liu and Shaojie Tang and Jianwei Niu and Zhangmin Huang",
note = "Publisher Copyright: {\textcopyright} 2021, Springer Nature Switzerland AG.; 26th International Conference on Database Systems for Advanced Applications, DASFAA 2021 ; Conference date: 11-04-2021 Through 14-04-2021",
year = "2021",
doi = "10.1007/978-3-030-73194-6\_3",
language = "英语",
isbn = "9783030731939",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "37--52",
editor = "Jensen, \{Christian S.\} and Ee-Peng Lim and De-Nian Yang and Wang-Chien Lee and Tseng, \{Vincent S.\} and Vana Kalogeraki and Jen-Wei Huang and Chih-Ya Shen",
booktitle = "Database Systems for Advanced Applications - 26th International Conference, DASFAA 2021, Proceedings",
address = "德国",
}