diff --git a/results/lora_sft_2/test/test1.yaml b/results/lora_sft_2/test/test1.yaml index 33701533..62bfe478 100644 --- a/results/lora_sft_2/test/test1.yaml +++ b/results/lora_sft_2/test/test1.yaml @@ -31,7 +31,7 @@ lr_scheduler_type: cosine warmup_ratio: 0.1 fp16: true ddp_timeout: 180000000 -max_steps: 100 +max_steps: 1000 include_num_input_tokens_seen: true include_tokens_per_second: true