diff --git a/results/inference/Baichuan2-7B/Baichuan2_predict_1.yaml b/results/inference/Baichuan2-7B/Baichuan2_predict_1.yaml index 385b2634..f12fd9ff 100644 --- a/results/inference/Baichuan2-7B/Baichuan2_predict_1.yaml +++ b/results/inference/Baichuan2-7B/Baichuan2_predict_1.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method do_predict: true diff --git a/results/inference/Baichuan2-7B/Baichuan2_predict_1_single.yaml b/results/inference/Baichuan2-7B/Baichuan2_predict_1_single.yaml index 8d889b2f..9ac8bb3c 100644 --- a/results/inference/Baichuan2-7B/Baichuan2_predict_1_single.yaml +++ b/results/inference/Baichuan2-7B/Baichuan2_predict_1_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method do_predict: true diff --git a/results/inference/Baichuan2-7B/Baichuan2_predict_2.yaml b/results/inference/Baichuan2-7B/Baichuan2_predict_2.yaml index 553d870c..86c072fc 100644 --- a/results/inference/Baichuan2-7B/Baichuan2_predict_2.yaml +++ b/results/inference/Baichuan2-7B/Baichuan2_predict_2.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method do_predict: true diff --git a/results/inference/Baichuan2-7B/Baichuan2_predict_2_single.yaml b/results/inference/Baichuan2-7B/Baichuan2_predict_2_single.yaml index cc133ba8..22bddb02 100644 --- a/results/inference/Baichuan2-7B/Baichuan2_predict_2_single.yaml +++ b/results/inference/Baichuan2-7B/Baichuan2_predict_2_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method do_predict: true diff --git a/results/inference/Baichuan2-7B/Baichuan2_predict_3.yaml b/results/inference/Baichuan2-7B/Baichuan2_predict_3.yaml index cdd18be7..78c1d1b7 100644 --- a/results/inference/Baichuan2-7B/Baichuan2_predict_3.yaml +++ b/results/inference/Baichuan2-7B/Baichuan2_predict_3.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method do_predict: true diff --git a/results/inference/Baichuan2-7B/Baichuan2_predict_3_single.yaml b/results/inference/Baichuan2-7B/Baichuan2_predict_3_single.yaml index e590d6ca..99f9305a 100644 --- a/results/inference/Baichuan2-7B/Baichuan2_predict_3_single.yaml +++ b/results/inference/Baichuan2-7B/Baichuan2_predict_3_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method do_predict: true diff --git a/results/inference/Qwen-7B/Qwen_predict_1.yaml b/results/inference/Qwen-7B/Qwen_predict_1.yaml index e4c54c23..22fc846a 100644 --- a/results/inference/Qwen-7B/Qwen_predict_1.yaml +++ b/results/inference/Qwen-7B/Qwen_predict_1.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method do_predict: true diff --git a/results/inference/Qwen-7B/Qwen_predict_1_single.yaml b/results/inference/Qwen-7B/Qwen_predict_1_single.yaml index 1852598a..6d372817 100644 --- a/results/inference/Qwen-7B/Qwen_predict_1_single.yaml +++ b/results/inference/Qwen-7B/Qwen_predict_1_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method do_predict: true diff --git a/results/inference/Qwen-7B/Qwen_predict_2.yaml b/results/inference/Qwen-7B/Qwen_predict_2.yaml index 2cbde5fe..c6e936b2 100644 --- a/results/inference/Qwen-7B/Qwen_predict_2.yaml +++ b/results/inference/Qwen-7B/Qwen_predict_2.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method do_predict: true diff --git a/results/inference/Qwen-7B/Qwen_predict_2_single.yaml b/results/inference/Qwen-7B/Qwen_predict_2_single.yaml index c151ffdb..69a26e2f 100644 --- a/results/inference/Qwen-7B/Qwen_predict_2_single.yaml +++ b/results/inference/Qwen-7B/Qwen_predict_2_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method do_predict: true diff --git a/results/inference/Qwen-7B/Qwen_predict_3.yaml b/results/inference/Qwen-7B/Qwen_predict_3.yaml index 4f31cc9a..e4014295 100644 --- a/results/inference/Qwen-7B/Qwen_predict_3.yaml +++ b/results/inference/Qwen-7B/Qwen_predict_3.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method do_predict: true diff --git a/results/inference/Qwen-7B/Qwen_predict_3_single.yaml b/results/inference/Qwen-7B/Qwen_predict_3_single.yaml index a9f2c753..3935c3e9 100644 --- a/results/inference/Qwen-7B/Qwen_predict_3_single.yaml +++ b/results/inference/Qwen-7B/Qwen_predict_3_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method do_predict: true diff --git a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_1.yaml b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_1.yaml index f41903e8..2d72254d 100644 --- a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_1.yaml +++ b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_1.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method stage: sft diff --git a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_1_single.yaml b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_1_single.yaml index c10638e7..a05c246b 100644 --- a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_1_single.yaml +++ b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_1_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method stage: sft diff --git a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_2.yaml b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_2.yaml index 019b3fe0..6d2c1f49 100644 --- a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_2.yaml +++ b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_2.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method stage: sft diff --git a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_2_single.yaml b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_2_single.yaml index c35cc67d..c0e80f6a 100644 --- a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_2_single.yaml +++ b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_2_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method stage: sft diff --git a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_3.yaml b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_3.yaml index 6305a915..246ec950 100644 --- a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_3.yaml +++ b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_3.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method stage: sft diff --git a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_3_single.yaml b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_3_single.yaml index c556d448..8d000a4e 100644 --- a/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_3_single.yaml +++ b/results/lora_sft/Baichuan2-7B/Baichuan2_lora_sft_3_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: baichuan-inc/baichuan-7B +model_name_or_path: ../../llm/baichuan ### method stage: sft diff --git a/results/lora_sft/Qwen-7B/Qwen_lora_sft_1.yaml b/results/lora_sft/Qwen-7B/Qwen_lora_sft_1.yaml index c8d6820f..cbb067f7 100644 --- a/results/lora_sft/Qwen-7B/Qwen_lora_sft_1.yaml +++ b/results/lora_sft/Qwen-7B/Qwen_lora_sft_1.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method stage: sft diff --git a/results/lora_sft/Qwen-7B/Qwen_lora_sft_1_single.yaml b/results/lora_sft/Qwen-7B/Qwen_lora_sft_1_single.yaml index add04a57..5a0cdb40 100644 --- a/results/lora_sft/Qwen-7B/Qwen_lora_sft_1_single.yaml +++ b/results/lora_sft/Qwen-7B/Qwen_lora_sft_1_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method stage: sft diff --git a/results/lora_sft/Qwen-7B/Qwen_lora_sft_2.yaml b/results/lora_sft/Qwen-7B/Qwen_lora_sft_2.yaml index 1196ca97..15100500 100644 --- a/results/lora_sft/Qwen-7B/Qwen_lora_sft_2.yaml +++ b/results/lora_sft/Qwen-7B/Qwen_lora_sft_2.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method stage: sft diff --git a/results/lora_sft/Qwen-7B/Qwen_lora_sft_2_single.yaml b/results/lora_sft/Qwen-7B/Qwen_lora_sft_2_single.yaml index 7f1aeac4..86bb1001 100644 --- a/results/lora_sft/Qwen-7B/Qwen_lora_sft_2_single.yaml +++ b/results/lora_sft/Qwen-7B/Qwen_lora_sft_2_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method stage: sft diff --git a/results/lora_sft/Qwen-7B/Qwen_lora_sft_3.yaml b/results/lora_sft/Qwen-7B/Qwen_lora_sft_3.yaml index 96c32ac4..8ff184cf 100644 --- a/results/lora_sft/Qwen-7B/Qwen_lora_sft_3.yaml +++ b/results/lora_sft/Qwen-7B/Qwen_lora_sft_3.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method stage: sft diff --git a/results/lora_sft/Qwen-7B/Qwen_lora_sft_3_single.yaml b/results/lora_sft/Qwen-7B/Qwen_lora_sft_3_single.yaml index da2464d6..1c761a8e 100644 --- a/results/lora_sft/Qwen-7B/Qwen_lora_sft_3_single.yaml +++ b/results/lora_sft/Qwen-7B/Qwen_lora_sft_3_single.yaml @@ -1,5 +1,5 @@ ### model -model_name_or_path: qwen/Qwen-7B +model_name_or_path: ../../llm/qwen ### method stage: sft diff --git a/src/gpu_status.py b/src/gpu_status.py index cabff59a..76154695 100644 --- a/src/gpu_status.py +++ b/src/gpu_status.py @@ -26,7 +26,7 @@ def main(): cur_time = time.strftime("%Y-%m-%d %H:%M:%S", time.localtime()), all_gpu_status = all_gpu_status ) - with open("./results/gpu_status.json", "a", encoding="utf-8") as f: + with open("./results/gpu_status_0821.json", "a", encoding="utf-8") as f: f.write(json.dumps(logs) + "\n") print(logs) time.sleep(60)