add gradient checkpointing

This commit is contained in:
JustinLin610
2023-09-12 23:10:59 +08:00
parent c5f7fa9487
commit 73f4040abb
4 changed files with 4 additions and 0 deletions

View File

@@ -44,4 +44,5 @@ torchrun $DISTRIBUTED_ARGS finetune.py \
  --model_max_length 2048 \
  --lazy_preprocess True \
  --use_lora \
+ --gradient_checkpointing \
  --deepspeed finetune/ds_config_zero2.json

View File

@@ -32,4 +32,5 @@ python finetune.py \
  --report_to "none" \
  --model_max_length 2048 \
  --lazy_preprocess True \
+ --gradient_checkpointing \
  --use_lora

View File

@@ -46,4 +46,5 @@ torchrun $DISTRIBUTED_ARGS finetune.py \
  --lazy_preprocess True \
  --use_lora \
  --q_lora \
+ --gradient_checkpointing \
  --deepspeed finetune/ds_config_zero2.json

View File

@@ -32,5 +32,6 @@ python finetune.py \
  --report_to "none" \
  --model_max_length 2048 \
  --lazy_preprocess True \
+ --gradient_checkpointing \
  --use_lora \
  --q_lora