llama3_lora_dpo.yaml
|
update train hparams
|
2024-06-06 01:49:20 +08:00 |
llama3_lora_eval.yaml
|
update examples
|
2024-05-17 01:02:00 +08:00 |
llama3_lora_kto.yaml
|
update train hparams
|
2024-06-06 01:49:20 +08:00 |
llama3_lora_ppo.yaml
|
fix #4005 #4013
|
2024-06-03 19:12:29 +08:00 |
llama3_lora_pretrain.yaml
|
update train hparams
|
2024-06-06 01:49:20 +08:00 |
llama3_lora_reward.yaml
|
update train hparams
|
2024-06-06 01:49:20 +08:00 |
llama3_lora_sft.yaml
|
update train hparams
|
2024-06-06 01:49:20 +08:00 |
llama3_preprocess.yaml
|
improve KTO impl., replace datasets
|
2024-05-18 03:44:56 +08:00 |
llava1_5_lora_sft.yaml
|
update train hparams
|
2024-06-06 01:49:20 +08:00 |