% Conference paper from the 31st International Conference on Computational
% Linguistics (COLING 2025), pages 4813--4839.
% The citation key is kept unchanged so existing \cite commands keep resolving.
% NOTE(review): the address field holds a country name as exported; BibTeX
% conventionally expects the publisher's city there -- confirm against the
% publisher's record before relying on it.
% NOTE(review): booktitle was the bare track label "Main Conference"; it now
% spells out the proceedings title derived from the conference name recorded in
% the note field -- confirm the exact wording against the proceedings front matter.
@inproceedings{010873ea5e2047259b1c6804a4d65579,
  author    = {Zhang, Jianfei and Bai, Jun and Li, Bei and Wang, Yanmeng and Li, Rumei and Lin, Chenghua and Rong, Wenge},
  title     = {Disentangling Preference Representation and Text Generation for Efficient Individual Preference Alignment},
  booktitle = {Proceedings of the 31st International Conference on Computational Linguistics ({COLING} 2025): Main Conference},
  editor    = {Rambow, Owen and Wanner, Leo and Apidianaki, Marianna and Al-Khalifa, Hend and {Di Eugenio}, Barbara and Schockaert, Steven},
  series    = {Proceedings - International Conference on Computational Linguistics, {COLING}},
  publisher = {Association for Computational Linguistics (ACL)},
  address   = {Australia},
  pages     = {4813--4839},
  year      = {2025},
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} 2025 Association for Computational Linguistics.; 31st International Conference on Computational Linguistics, COLING 2025 ; Conference date: 19-01-2025 Through 24-01-2025},
  abstract  = {Aligning Large Language Models (LLMs) with general human preferences has been proved crucial in improving the interaction quality between LLMs and human. However, human values are inherently diverse among different individuals, making it insufficient to align LLMs solely with general preferences. To address this, personalizing LLMs according to individual feedback emerges as a promising solution. Nonetheless, this approach presents challenges in terms of the efficiency of alignment algorithms. In this work, we introduce a flexible paradigm for individual preference alignment. Our method fundamentally improves efficiency by disentangling preference representation from text generation in LLMs. We validate our approach across multiple text generation tasks and demonstrate that it can produce aligned quality as well as or better than PEFT-based methods, while reducing additional training time for each new individual preference by 80\% to 90\% in comparison with them.},
}