Merge pull request #4309 from EliMCosta/patch-1
Add Magpie and Webinstruct dataset samples
This commit is contained in:
commit
10316dd8ca
|
@ -270,6 +270,8 @@ You also can add a custom chat template to [template.py](src/llamafactory/data/t
|
||||||
- [Booksum (de)](https://huggingface.co/datasets/mayflowergmbh/booksum_de)
|
- [Booksum (de)](https://huggingface.co/datasets/mayflowergmbh/booksum_de)
|
||||||
- [Airoboros (de)](https://huggingface.co/datasets/mayflowergmbh/airoboros-3.0_de)
|
- [Airoboros (de)](https://huggingface.co/datasets/mayflowergmbh/airoboros-3.0_de)
|
||||||
- [Ultrachat (de)](https://huggingface.co/datasets/mayflowergmbh/ultra-chat_de)
|
- [Ultrachat (de)](https://huggingface.co/datasets/mayflowergmbh/ultra-chat_de)
|
||||||
|
- [WebInstructSub (en)](https://huggingface.co/datasets/TIGER-Lab/WebInstructSub)
|
||||||
|
- [Magpie-Pro-300K-Filtered (en)](https://huggingface.co/datasets/Magpie-Align/Magpie-Pro-300K-Filtered)
|
||||||
|
|
||||||
</details>
|
</details>
|
||||||
|
|
||||||
|
|
|
@ -270,6 +270,8 @@ https://github.com/hiyouga/LLaMA-Factory/assets/16256802/ec36a9dd-37f4-4f72-81bd
|
||||||
- [Booksum (de)](https://huggingface.co/datasets/mayflowergmbh/booksum_de)
|
- [Booksum (de)](https://huggingface.co/datasets/mayflowergmbh/booksum_de)
|
||||||
- [Airoboros (de)](https://huggingface.co/datasets/mayflowergmbh/airoboros-3.0_de)
|
- [Airoboros (de)](https://huggingface.co/datasets/mayflowergmbh/airoboros-3.0_de)
|
||||||
- [Ultrachat (de)](https://huggingface.co/datasets/mayflowergmbh/ultra-chat_de)
|
- [Ultrachat (de)](https://huggingface.co/datasets/mayflowergmbh/ultra-chat_de)
|
||||||
|
- [WebInstructSub (en)](https://huggingface.co/datasets/TIGER-Lab/WebInstructSub)
|
||||||
|
- [Magpie-Pro-300K-Filtered (en)](https://huggingface.co/datasets/Magpie-Align/Magpie-Pro-300K-Filtered)
|
||||||
|
|
||||||
</details>
|
</details>
|
||||||
|
|
||||||
|
|
|
@ -524,13 +524,13 @@
|
||||||
"prompt": "text"
|
"prompt": "text"
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"fileweb": {
|
"fineweb": {
|
||||||
"hf_hub_url": "HuggingFaceFW/fineweb",
|
"hf_hub_url": "HuggingFaceFW/fineweb",
|
||||||
"columns": {
|
"columns": {
|
||||||
"prompt": "text"
|
"prompt": "text"
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"fileweb_edu": {
|
"fineweb_edu": {
|
||||||
"hf_hub_url": "HuggingFaceFW/fineweb-edu",
|
"hf_hub_url": "HuggingFaceFW/fineweb-edu",
|
||||||
"columns": {
|
"columns": {
|
||||||
"prompt": "text"
|
"prompt": "text"
|
||||||
|
@ -550,5 +550,25 @@
|
||||||
"prompt": "content"
|
"prompt": "content"
|
||||||
},
|
},
|
||||||
"folder": "python"
|
"folder": "python"
|
||||||
|
},
|
||||||
|
"Magpie-Pro-300K-Filtered": {
|
||||||
|
"hf_hub_url": "Magpie-Align/Magpie-Pro-300K-Filtered",
|
||||||
|
"columns": {
|
||||||
|
"messages": "conversations"
|
||||||
|
},
|
||||||
|
"tags": {
|
||||||
|
"role_tag": "from",
|
||||||
|
"content_tag": "value",
|
||||||
|
"user_tag": "human",
|
||||||
|
"assistant_tag": "gpt"
|
||||||
|
},
|
||||||
|
"formatting": "sharegpt"
|
||||||
|
},
|
||||||
|
"WebInstructSub": {
|
||||||
|
"hf_hub_url": "TIGER-Lab/WebInstructSub",
|
||||||
|
"columns": {
|
||||||
|
"prompt": "question",
|
||||||
|
"response": "answer"
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
Loading…
Reference in New Issue