mirror of
https://github.com/QwenLM/Qwen.git
synced 2026-05-20 16:35:47 +08:00
Merge pull request #403 from QwenLM/JustinLin610-patch-2
Update finetune.py
This commit is contained in:
@@ -319,6 +319,10 @@ def train():
|
||||
tokenizer.pad_token_id = tokenizer.eod_id
|
||||
|
||||
if training_args.use_lora:
|
||||
+ if lora_args.q_lora:
|
||||
+ modules_to_save = None
|
||||
+ else:
|
||||
+ modules_to_save = ["wte", "lm_head"]
|
||||
lora_config = LoraConfig(
|
||||
r=lora_args.lora_r,
|
||||
lora_alpha=lora_args.lora_alpha,
|
||||
@@ -326,7 +330,7 @@ def train():
|
||||
lora_dropout=lora_args.lora_dropout,
|
||||
bias=lora_args.lora_bias,
|
||||
task_type="CAUSAL_LM",
|
||||
- modules_to_save=["wte", "lm_head"] # This argument serves for adding new tokens.
|
||||
+ modules_to_save=modules_to_save # This argument serves for adding new tokens.
|
||||
)
|
||||
if lora_args.q_lora:
|
||||
model = prepare_model_for_kbit_training(
|
||||
|
||||
Reference in New Issue
Block a user