diff --git a/README.md b/README.md index 4495e697..141587fd 100644 --- a/README.md +++ b/README.md @@ -73,6 +73,7 @@ - [UltraChat](https://github.com/thunlp/UltraChat) - [Open Assistant](https://huggingface.co/datasets/OpenAssistant/oasst1) - [Open Assistant (Chinese)](https://huggingface.co/datasets/OpenAssistant/oasst1) + - [WebNovel (Chinese)](https://huggingface.co/datasets/zxbsmk/webnovel_cn) - For reward model training: - [HH-RLHF](https://huggingface.co/datasets/Anthropic/hh-rlhf) - [Open Assistant](https://huggingface.co/datasets/OpenAssistant/oasst1) diff --git a/data/dataset_info.json b/data/dataset_info.json index 5ad42e64..a4323e3b 100644 --- a/data/dataset_info.json +++ b/data/dataset_info.json @@ -149,5 +149,8 @@ "response": "", "history": "" } + }, + "novel_tokens512_50k": { + "hf_hub_url": "zxbsmk/webnovel_cn" } }