forked from super_cognition/zhuoshi_llm_factory
df192611e3 | ||
---|---|---|
.. | ||
dpo.sh | ||
orpo.sh | ||
ppo.sh | ||
predict.sh | ||
prepare.sh | ||
pretrain.sh | ||
reward.sh | ||
sft.sh | ||
sft_mllm.sh |
df192611e3 | ||
---|---|---|
.. | ||
dpo.sh | ||
orpo.sh | ||
ppo.sh | ||
predict.sh | ||
prepare.sh | ||
pretrain.sh | ||
reward.sh | ||
sft.sh | ||
sft_mllm.sh |