Merge pull request #296 from QwenLM/features/add_finetuning

add gradient checkpointing
main
Junyang Lin 2 years ago committed by GitHub
commit fcb36b7a94
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

@@ -44,4 +44,5 @@ torchrun $DISTRIBUTED_ARGS finetune.py \
--model_max_length 2048 \
--lazy_preprocess True \
--use_lora \
--gradient_checkpointing \
--deepspeed finetune/ds_config_zero2.json

@@ -32,4 +32,5 @@ python finetune.py \
--report_to "none" \
--model_max_length 2048 \
--lazy_preprocess True \
--gradient_checkpointing \
--use_lora

@@ -46,4 +46,5 @@ torchrun $DISTRIBUTED_ARGS finetune.py \
--lazy_preprocess True \
--use_lora \
--q_lora \
--gradient_checkpointing \
--deepspeed finetune/ds_config_zero2.json

@@ -32,5 +32,6 @@ python finetune.py \
--report_to "none" \
--model_max_length 2048 \
--lazy_preprocess True \
--gradient_checkpointing \
--use_lora \
--q_lora
Loading…
Cancel
Save