Merge pull request #296 from QwenLM/features/add_finetuning

Add gradient checkpointing: pass `--gradient_checkpointing` to `finetune.py` in all four finetuning launch scripts.
This commit is contained in:
Junyang Lin
2023-09-12 23:11:47 +08:00
committed by GitHub
4 changed files with 4 additions and 0 deletions

View File

@@ -44,4 +44,5 @@ torchrun $DISTRIBUTED_ARGS finetune.py \
--model_max_length 2048 \
--lazy_preprocess True \
--use_lora \
--gradient_checkpointing \
--deepspeed finetune/ds_config_zero2.json

View File

@@ -32,4 +32,5 @@ python finetune.py \
--report_to "none" \
--model_max_length 2048 \
--lazy_preprocess True \
--gradient_checkpointing \
--use_lora

View File

@@ -46,4 +46,5 @@ torchrun $DISTRIBUTED_ARGS finetune.py \
--lazy_preprocess True \
--use_lora \
--q_lora \
--gradient_checkpointing \
--deepspeed finetune/ds_config_zero2.json

View File

@@ -32,5 +32,6 @@ python finetune.py \
--report_to "none" \
--model_max_length 2048 \
--lazy_preprocess True \
--gradient_checkpointing \
--use_lora \
--q_lora