forked from p04798526/LLaMA-Factory-Mirror
chore: change yaml and git ignore
This commit is contained in:
parent
c2b4a2db78
commit
7f5b10d654
|
@ -166,5 +166,5 @@ cache/
|
||||||
config/
|
config/
|
||||||
output/
|
output/
|
||||||
wandb/
|
wandb/
|
||||||
|
results/lora_sft
|
||||||
|
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_1
|
output_dir: ./results/lora_sft_2/Baichuan2-7B/Baichuan2_lora_sft_1
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_1_single
|
output_dir: ./results/lora_sft_2/Baichuan2-7B/Baichuan2_lora_sft_1_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_2
|
output_dir: ./results/lora_sft_2/Baichuan2-7B/Baichuan2_lora_sft_2
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_2_single
|
output_dir: ./results/lora_sft_2/Baichuan2-7B/Baichuan2_lora_sft_2_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_3
|
output_dir: ./results/lora_sft_2/Baichuan2-7B/Baichuan2_lora_sft_3
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_3_single
|
output_dir: ./results/lora_sft_2/Baichuan2-7B/Baichuan2_lora_sft_3_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/ChatGLM2-6B/ChatGLM2_lora_sft_1
|
output_dir: ./results/lora_sft_2/ChatGLM2-6B/ChatGLM2_lora_sft_1
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/ChatGLM2-6B/ChatGLM2_lora_sft_1_single
|
output_dir: ./results/lora_sft_2/ChatGLM2-6B/ChatGLM2_lora_sft_1_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/ChatGLM2-6B/ChatGLM2_lora_sft_2
|
output_dir: ./results/lora_sft_2/ChatGLM2-6B/ChatGLM2_lora_sft_2
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/ChatGLM2-6B/ChatGLM2_lora_sft_2_single
|
output_dir: ./results/lora_sft_2/ChatGLM2-6B/ChatGLM2_lora_sft_2_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/ChatGLM2-6B/ChatGLM2_lora_sft_3
|
output_dir: ./results/lora_sft_2/ChatGLM2-6B/ChatGLM2_lora_sft_3
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/ChatGLM2-6B/ChatGLM2_lora_sft_3_single
|
output_dir: ./results/lora_sft_2/ChatGLM2-6B/ChatGLM2_lora_sft_3_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Llama2-7B/llama2_lora_sft_1
|
output_dir: ./results/lora_sft_2/Llama2-7B/llama2_lora_sft_1
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Llama2-7B/llama2_lora_sft_1_single
|
output_dir: ./results/lora_sft_2/Llama2-7B/llama2_lora_sft_1_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Llama2-7B/llama2_lora_sft_2
|
output_dir: ./results/lora_sft_2/Llama2-7B/llama2_lora_sft_2
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Llama2-7B/llama2_lora_sft_2_single
|
output_dir: ./results/lora_sft_2/Llama2-7B/llama2_lora_sft_2_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Llama2-7B/llama2_lora_sft_3
|
output_dir: ./results/lora_sft_2/Llama2-7B/llama2_lora_sft_3
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Llama2-7B/llama2_lora_sft_3_single
|
output_dir: ./results/lora_sft_2/Llama2-7B/llama2_lora_sft_3_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Qwen-7B/Qwen_lora_sft_1
|
output_dir: ./results/lora_sft_2/Qwen-7B/Qwen_lora_sft_1
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Qwen-7B/Qwen_lora_sft_1_single
|
output_dir: ./results/lora_sft_2/Qwen-7B/Qwen_lora_sft_1_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Qwen-7B/Qwen_lora_sft_2
|
output_dir: ./results/lora_sft_2/Qwen-7B/Qwen_lora_sft_2
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Qwen-7B/Qwen_lora_sft_2_single
|
output_dir: ./results/lora_sft_2/Qwen-7B/Qwen_lora_sft_2_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Qwen-7B/Qwen_lora_sft_3
|
output_dir: ./results/lora_sft_2/Qwen-7B/Qwen_lora_sft_3
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
|
@ -16,7 +16,7 @@ overwrite_cache: true
|
||||||
preprocessing_num_workers: 16
|
preprocessing_num_workers: 16
|
||||||
|
|
||||||
### output
|
### output
|
||||||
output_dir: ./results/lora_sft/Qwen-7B/Qwen_lora_sft_3_single
|
output_dir: ./results/lora_sft_2/Qwen-7B/Qwen_lora_sft_3_single
|
||||||
logging_steps: 3
|
logging_steps: 3
|
||||||
save_steps: 500
|
save_steps: 500
|
||||||
plot_loss: true
|
plot_loss: true
|
||||||
|
|
Loading…
Reference in New Issue