From c689857bbb82ecaa317bfc22d831c7025fe39cc7 Mon Sep 17 00:00:00 2001
From: hiyouga <hiyouga@buaa.edu.cn>
Date: Wed, 2 Aug 2023 16:10:31 +0800
Subject: [PATCH] release v0.1.5

---
 README.md                       |  2 ++
 README_zh.md                    |  2 ++
 src/llmtuner/__init__.py        |  2 +-
 src/llmtuner/extras/template.py | 40 ++++++++++++++++++---------------
 4 files changed, 27 insertions(+), 19 deletions(-)
diff --git a/README.md b/README.md
index 6674fe71..9758079c 100644
--- a/README.md
+++ b/README.md
@@ -196,6 +196,8 @@ CUDA_VISIBLE_DEVICES=0 python src/train_bash.py \
     --fp16
 ```
 
+Remember to specify `--lora_target W_pack` if you are using Baichuan models.
+
 ### Reward Model Training
 
 ```bash
diff --git a/README_zh.md b/README_zh.md
index 125e278d..ae2ad81b 100644
--- a/README_zh.md
+++ b/README_zh.md
@@ -196,6 +196,8 @@ CUDA_VISIBLE_DEVICES=0 python src/train_bash.py \
     --fp16
 ```
 
+使用 Baichuan 模型时请指定 `--lora_target W_pack` 参数。
+
 ### 奖励模型训练
 
 ```bash
diff --git a/src/llmtuner/__init__.py b/src/llmtuner/__init__.py
index 7ce46808..b3b28109 100644
--- a/src/llmtuner/__init__.py
+++ b/src/llmtuner/__init__.py
@@ -1,4 +1,4 @@
 from llmtuner.chat import ChatModel
 
 
-__version__ = "0.1.4"
+__version__ = "0.1.5"
diff --git a/src/llmtuner/extras/template.py b/src/llmtuner/extras/template.py
index 567b9102..cc3f2b1d 100644
--- a/src/llmtuner/extras/template.py
+++ b/src/llmtuner/extras/template.py
@@ -46,34 +46,37 @@ class Template:
         prefix = prefix + self.sep if prefix else "" # add separator for non-empty prefix
         history = history if (history and self.use_history) else []
         history = history + [(query, "")]
-        convs = [
-            [(self.sep if turn_idx else prefix) + self.prompt.format(query=query_i), resp_i]
-            for turn_idx, (query_i, resp_i) in enumerate(history)
+        return [
+            [(self.sep if i else prefix) + self.prompt.format(query=q), r]
+            for i, (q, r) in enumerate(history)
         ]
-        return convs
 
 
+@dataclass
 class Llama2Template(Template):
-    def _format_example(self, query, history, prefix):
-        sys = prefix or self.prefix
-        if not sys.startswith("<<SYS>>\n"):
-            sys = f"<<SYS>>\n{sys.strip()}\n<</SYS>>\n\n"
+
+    def _format_example(
+        self,
+        query: str,
+        history: Optional[List[Tuple[str, str]]] = None,
+        prefix: Optional[str] = ""
+    ) -> List[Tuple[str, str]]:
+        prefix = prefix or self.prefix # use prefix if provided
+        prefix = prefix if prefix.startswith("<<SYS>>") else "<<SYS>>\n{}\n<</SYS>>\n\n".format(prefix)
         history = history if (history and self.use_history) else []
         history = history + [(query, "")]
-        convs = []
-        for turn_idx, (query_i, resp_i) in enumerate(history):
-            if turn_idx == 0:
-                convs.append([self.prompt.format(query=sys+query_i), resp_i])
-            else:
-                convs.append([self.sep + self.prompt.format(query=query_i), resp_i])
-        return convs
+        return [
+            [(self.sep if i else "") + self.prompt.format(query=(q if i else prefix + q)), r]
+            for i, (q, r) in enumerate(history)
+        ]
 
 
 templates: Dict[str, Template] = {}
 
 
 def register_template(name: str, prefix: str, prompt: str, sep: str, use_history: bool) -> None:
-    templates[name] = Template(
+    template_class = Llama2Template if name == "llama2" else Template
+    templates[name] = template_class(
         prefix=prefix,
         prompt=prompt,
         sep=sep,
@@ -117,7 +120,8 @@ Supports: https://huggingface.co/meta-llama/Llama-2-7b-chat-hf
           https://huggingface.co/meta-llama/Llama-2-13b-chat-hf
           https://huggingface.co/meta-llama/Llama-2-70b-chat-hf
 """
-templates["llama2"] = Llama2Template(
+register_template(
+    name="llama2",
     prefix="<<SYS>>\nYou are a helpful, respectful and honest assistant. "
            "Always answer as helpfully as possible, while being safe.  "
            "Your answers should not include any harmful, unethical, "
@@ -126,7 +130,7 @@ templates["llama2"] = Llama2Template(
            "If a question does not make any sense, or is not factually coherent, "
            "explain why instead of answering something not correct. "
            "If you don't know the answer to a question, please don't share false information.\n<</SYS>>\n\n",
-    prompt="[INST]{query}[/INST]",
+    prompt="[INST] {query} [/INST] ",
     sep="<s>",
     use_history=True
 )