From eeb5249d0b6ce0816e1fa47afc3a853c7b267cbf Mon Sep 17 00:00:00 2001
From: Yuchen Han <42163912+hannlp@users.noreply.github.com>
Date: Fri, 17 Nov 2023 00:16:27 -0800
Subject: [PATCH] Read ppo_epochs from finetuning_args instead of hard-coding 1 in PPO workflow

---
 src/llmtuner/train/ppo/workflow.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/src/llmtuner/train/ppo/workflow.py b/src/llmtuner/train/ppo/workflow.py
index 41a99e2c..4fb9d593 100644
--- a/src/llmtuner/train/ppo/workflow.py
+++ b/src/llmtuner/train/ppo/workflow.py
@@ -45,7 +45,7 @@ def run_ppo(
         mini_batch_size=training_args.per_device_train_batch_size,
         batch_size=training_args.per_device_train_batch_size * training_args.gradient_accumulation_steps,
         gradient_accumulation_steps=training_args.gradient_accumulation_steps,
-        ppo_epochs=1,
+        ppo_epochs=finetuning_args.ppo_epochs,
         max_grad_norm=training_args.max_grad_norm,
         seed=training_args.seed,
         optimize_device_cache=True,