release v0.1.5

This commit is contained in:
hiyouga 2023-08-02 16:10:31 +08:00
parent 8ca01e53a8
commit c689857bbb
4 changed files with 27 additions and 19 deletions

View File

@ -196,6 +196,8 @@ CUDA_VISIBLE_DEVICES=0 python src/train_bash.py \
--fp16 --fp16
``` ```
Remember to specify `--lora_target W_pack` if you are using Baichuan models.
### Reward Model Training ### Reward Model Training
```bash ```bash

View File

@ -196,6 +196,8 @@ CUDA_VISIBLE_DEVICES=0 python src/train_bash.py \
--fp16 --fp16
``` ```
使用 Baichuan 模型时请指定 `--lora_target W_pack` 参数。
### 奖励模型训练 ### 奖励模型训练
```bash ```bash

View File

@ -1,4 +1,4 @@
from llmtuner.chat import ChatModel from llmtuner.chat import ChatModel
__version__ = "0.1.4" __version__ = "0.1.5"

View File

@ -46,34 +46,37 @@ class Template:
prefix = prefix + self.sep if prefix else "" # add separator for non-empty prefix prefix = prefix + self.sep if prefix else "" # add separator for non-empty prefix
history = history if (history and self.use_history) else [] history = history if (history and self.use_history) else []
history = history + [(query, "")] history = history + [(query, "")]
convs = [ return [
[(self.sep if turn_idx else prefix) + self.prompt.format(query=query_i), resp_i] [(self.sep if i else prefix) + self.prompt.format(query=q), r]
for turn_idx, (query_i, resp_i) in enumerate(history) for i, (q, r) in enumerate(history)
] ]
return convs
@dataclass
class Llama2Template(Template): class Llama2Template(Template):
def _format_example(self, query, history, prefix):
sys = prefix or self.prefix def _format_example(
if not sys.startswith("<<SYS>>\n"): self,
sys = f"<<SYS>>\n{sys.strip()}\n<</SYS>>\n\n" query: str,
history: Optional[List[Tuple[str, str]]] = None,
prefix: Optional[str] = ""
) -> List[Tuple[str, str]]:
prefix = prefix or self.prefix # use prefix if provided
prefix = prefix if prefix.startswith("<<SYS>>") else "<<SYS>>\n{}\n<</SYS>>\n\n".format(prefix)
history = history if (history and self.use_history) else [] history = history if (history and self.use_history) else []
history = history + [(query, "")] history = history + [(query, "")]
convs = [] return [
for turn_idx, (query_i, resp_i) in enumerate(history): [(self.sep if i else "") + self.prompt.format(query=(q if i else prefix + q)), r]
if turn_idx == 0: for i, (q, r) in enumerate(history)
convs.append([self.prompt.format(query=sys+query_i), resp_i]) ]
else:
convs.append([self.sep + self.prompt.format(query=query_i), resp_i])
return convs
templates: Dict[str, Template] = {} templates: Dict[str, Template] = {}
def register_template(name: str, prefix: str, prompt: str, sep: str, use_history: bool) -> None: def register_template(name: str, prefix: str, prompt: str, sep: str, use_history: bool) -> None:
templates[name] = Template( template_class = Llama2Template if name == "llama2" else Template
templates[name] = template_class(
prefix=prefix, prefix=prefix,
prompt=prompt, prompt=prompt,
sep=sep, sep=sep,
@ -117,7 +120,8 @@ Supports: https://huggingface.co/meta-llama/Llama-2-7b-chat-hf
https://huggingface.co/meta-llama/Llama-2-13b-chat-hf https://huggingface.co/meta-llama/Llama-2-13b-chat-hf
https://huggingface.co/meta-llama/Llama-2-70b-chat-hf https://huggingface.co/meta-llama/Llama-2-70b-chat-hf
""" """
templates["llama2"] = Llama2Template( register_template(
name="llama2",
prefix="<<SYS>>\nYou are a helpful, respectful and honest assistant. " prefix="<<SYS>>\nYou are a helpful, respectful and honest assistant. "
"Always answer as helpfully as possible, while being safe. " "Always answer as helpfully as possible, while being safe. "
"Your answers should not include any harmful, unethical, " "Your answers should not include any harmful, unethical, "
@ -126,7 +130,7 @@ templates["llama2"] = Llama2Template(
"If a question does not make any sense, or is not factually coherent, " "If a question does not make any sense, or is not factually coherent, "
"explain why instead of answering something not correct. " "explain why instead of answering something not correct. "
"If you don't know the answer to a question, please don't share false information.\n<</SYS>>\n\n", "If you don't know the answer to a question, please don't share false information.\n<</SYS>>\n\n",
prompt="[INST]{query}[/INST]", prompt="[INST] {query} [/INST] ",
sep="<s>", sep="<s>",
use_history=True use_history=True
) )