@inproceedings{95e3162a84154a92bed5ea89cf83fa3f,
title = "LasQ: Largest Singular Components Fine-Tuning for LLMs with Quantization",
abstract = "Large language models (LLMs) have demonstrated strong capabilities in various industries, but as the model parameters increase, the computational cost of fine-tuning the entire model becomes extremely high. To address this challenge, we focus on applying quantization and LoRA fine-tuning together in pre-training scenarios and propose an efficient parameter fine-tuning (PEFT) method, the LasQ (Largest Singular Components Fine-tuning for LLMs with Quantization) framework. Performs singular value decomposition on the pre-trained weights after quantization, using high-order singular value components to initialize the low rank adapter. We evaluate our method in natural language understanding, question answering, summarization, and natural language generation tasks. The experiments show that our method can significantly outperform existing methods with fewer training parameters. Compared with LoftQ and QLoRA methods, it has a 2\%–15\% improvement, and it can even achieve equivalent LoRA fine-tuning effects and full parameter fine-tuning effects.",
keywords = "Finetune, LLMs, Quantization",
author = "Xiang Zhao and Beining Lin and You Song",
note = "Publisher Copyright: {\textcopyright} The Author(s), under exclusive license to Springer Nature Singapore Pte Ltd. 2025.; 13th CCF International Conference on Natural Language Processing and Chinese Computing, NLPCC 2024 ; Conference date: 01-11-2024 Through 03-11-2024",
year = "2025",
doi = "10.1007/978-981-97-9437-9\_4",
language = "英语",
isbn = "9789819794362",
series = "Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)",
publisher = "Springer Science and Business Media Deutschland GmbH",
pages = "42--54",
editor = "Wong, \{Derek F.\} and Zhongyu Wei and Muyun Yang",
booktitle = "Natural Language Processing and Chinese Computing - 13th National CCF Conference, NLPCC 2024, Proceedings",
address = "德国",
}