diff --git a/README.md b/README.md index e98b18b0..b71303f2 100644 --- a/README.md +++ b/README.md @@ -437,6 +437,7 @@ accelerate launch src/train_bash.py # arguments (same as above) ```yaml compute_environment: LOCAL_MACHINE +debug: false distributed_type: MULTI_GPU downcast_bf16: 'no' gpu_ids: all diff --git a/README_zh.md b/README_zh.md index e00ff5a3..5c74e67a 100644 --- a/README_zh.md +++ b/README_zh.md @@ -437,6 +437,7 @@ accelerate launch src/train_bash.py # 参数同上 ```yaml compute_environment: LOCAL_MACHINE +debug: false distributed_type: MULTI_GPU downcast_bf16: 'no' gpu_ids: all diff --git a/src/llmtuner/webui/runner.py b/src/llmtuner/webui/runner.py index cfd6871b..66465057 100644 --- a/src/llmtuner/webui/runner.py +++ b/src/llmtuner/webui/runner.py @@ -144,7 +144,7 @@ class Runner: args["lora_target"] = get("train.lora_target") or get_module(get("top.model_name")) args["additional_target"] = get("train.additional_target") or None args["use_rslora"] = get("train.use_rslora") - if TRAINING_STAGES[get("train.training_stage")] in ["rm", "ppo", "dpo"]: + if args["stage"] in ["rm", "ppo", "dpo"]: args["create_new_adapter"] = args["quantization_bit"] is None else: args["create_new_adapter"] = get("train.create_new_adapter") @@ -166,7 +166,7 @@ class Runner: args["val_size"] = get("train.val_size") args["evaluation_strategy"] = "steps" args["eval_steps"] = get("train.save_steps") - args["load_best_model_at_end"] = True + args["load_best_model_at_end"] = args["stage"] not in ["rm", "ppo"] return args