mirror of
https://github.com/QwenLM/Qwen.git
synced 2026-05-20 16:35:47 +08:00
add gradient checkpointing
This commit is contained in:
@@ -44,4 +44,5 @@ torchrun $DISTRIBUTED_ARGS finetune.py \
 --model_max_length 2048 \
 --lazy_preprocess True \
 --use_lora \
+--gradient_checkpointing \
 --deepspeed finetune/ds_config_zero2.json
@@ -32,4 +32,5 @@ python finetune.py \
 --report_to "none" \
 --model_max_length 2048 \
 --lazy_preprocess True \
+--gradient_checkpointing \
 --use_lora
@@ -46,4 +46,5 @@ torchrun $DISTRIBUTED_ARGS finetune.py \
 --lazy_preprocess True \
 --use_lora \
 --q_lora \
+--gradient_checkpointing \
 --deepspeed finetune/ds_config_zero2.json
@@ -32,5 +32,6 @@ python finetune.py \
 --report_to "none" \
 --model_max_length 2048 \
 --lazy_preprocess True \
+--gradient_checkpointing \
 --use_lora \
 --q_lora
Reference in New Issue
Block a user