mirror of
https://github.com/QwenLM/Qwen.git
synced 2026-05-20 16:35:47 +08:00
Merge pull request #296 from QwenLM/features/add_finetuning
add gradient checkpointing
This commit is contained in:
@@ -44,4 +44,5 @@ torchrun $DISTRIBUTED_ARGS finetune.py \
|
||||
--model_max_length 2048 \
|
||||
--lazy_preprocess True \
|
||||
--use_lora \
|
||||
--gradient_checkpointing \
|
||||
--deepspeed finetune/ds_config_zero2.json
|
||||
@@ -32,4 +32,5 @@ python finetune.py \
|
||||
--report_to "none" \
|
||||
--model_max_length 2048 \
|
||||
--lazy_preprocess True \
|
||||
--gradient_checkpointing \
|
||||
--use_lora
|
||||
@@ -46,4 +46,5 @@ torchrun $DISTRIBUTED_ARGS finetune.py \
|
||||
--lazy_preprocess True \
|
||||
--use_lora \
|
||||
--q_lora \
|
||||
--gradient_checkpointing \
|
||||
--deepspeed finetune/ds_config_zero2.json
|
||||
@@ -32,5 +32,6 @@ python finetune.py \
|
||||
--report_to "none" \
|
||||
--model_max_length 2048 \
|
||||
--lazy_preprocess True \
|
||||
--gradient_checkpointing \
|
||||
--use_lora \
|
||||
--q_lora
|
||||
Reference in New Issue
Block a user