add ad gen dataset

This commit is contained in:
codemayq 2023-08-27 20:35:32 +08:00
parent ba94c8729d
commit 604f85487b
3 changed files with 12 additions and 0 deletions

View File

@ -105,6 +105,7 @@
- [Web QA (zh)](https://huggingface.co/datasets/suolyer/webqa)
- [UltraChat (en)](https://github.com/thunlp/UltraChat)
- [WebNovel (zh)](https://huggingface.co/datasets/zxbsmk/webnovel_cn)
- [Ad Gen (zh)](https://huggingface.co/datasets/HasturOfficial/adgen)
- For reward modeling or DPO training:
- [HH-RLHF (en)](https://huggingface.co/datasets/Anthropic/hh-rlhf)
- [Open Assistant (multilingual)](https://huggingface.co/datasets/OpenAssistant/oasst1)

View File

@ -105,6 +105,7 @@
- [Web QA (zh)](https://huggingface.co/datasets/suolyer/webqa)
- [UltraChat (en)](https://github.com/thunlp/UltraChat)
- [WebNovel (zh)](https://huggingface.co/datasets/zxbsmk/webnovel_cn)
- [Ad Gen (zh)](https://huggingface.co/datasets/HasturOfficial/adgen)
- 用于奖励模型或 DPO 训练:
- [HH-RLHF (en)](https://huggingface.co/datasets/Anthropic/hh-rlhf)
- [Open Assistant (multilingual)](https://huggingface.co/datasets/OpenAssistant/oasst1)

View File

@ -154,6 +154,16 @@
"hf_hub_url": "zxbsmk/webnovel_cn",
"stage": "sft"
},
"ad_gen": {
"hf_hub_url": "HasturOfficial/adgen",
"columns": {
"prompt": "content",
"query": "",
"response": "summary",
"history": ""
},
"stage": "sft"
},
"comparison_gpt4_en": {
"file_name": "comparison_gpt4_data_en.json",
"file_sha1": "96fa18313544e22444fe20eead7754b17da452ae",