diff --git a/deepspeed-telechat/sft/run_telechat_lora.sh b/deepspeed-telechat/sft/run_telechat_lora.sh index 49fac7c..8500387 100644 --- a/deepspeed-telechat/sft/run_telechat_lora.sh +++ b/deepspeed-telechat/sft/run_telechat_lora.sh @@ -47,7 +47,7 @@ deepspeed --master_port 29500 main.py \ --gradient_checkpointing \ --seed 42 \ --zero_stage $ZERO_STAGE \ - --save_steps 10 \ + --save_steps 100 \ --deepspeed \ --lora_dim 8 \ --mark_only_lora_as_trainable \