From 3448cf04de3d56aba17597b15307939e731abbf1 Mon Sep 17 00:00:00 2001
From: "hongliang.yuan"
Date: Mon, 25 Aug 2025 17:17:40 +0800
Subject: [PATCH] use_reentrant to reduce memory

---
 nlp/llm/mixtral/openrlhf/train_sft_mixtral_lora.sh | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/nlp/llm/mixtral/openrlhf/train_sft_mixtral_lora.sh b/nlp/llm/mixtral/openrlhf/train_sft_mixtral_lora.sh
index f702d4554..e60ba4dd6 100644
--- a/nlp/llm/mixtral/openrlhf/train_sft_mixtral_lora.sh
+++ b/nlp/llm/mixtral/openrlhf/train_sft_mixtral_lora.sh
@@ -22,7 +22,8 @@ openrlhf.cli.train_sft \
  --learning_rate 5e-6 \
  --lora_rank 64 \
  --lora_alpha 64 \
- --aux_loss_coef 0.001
+ --aux_loss_coef 0.001 \
+ --gradient_checkpointing_use_reentrant
 EOF
 
 if [[ ${1} != "slurm" ]]; then
-- 
Gitee