diff --git a/data/dataset_info.json b/data/dataset_info.json index d053be1d..18c4699a 100644 --- a/data/dataset_info.json +++ b/data/dataset_info.json @@ -73,6 +73,36 @@ "assistant_tag": "assistant" } }, + "llava_150k_en": { + "hf_hub_url": "BUAADreamer/llava-en-zh-300k", + "subset": "en", + "formatting": "sharegpt", + "columns": { + "messages": "messages", + "images": "images" + }, + "tags": { + "role_tag": "role", + "content_tag": "content", + "user_tag": "user", + "assistant_tag": "assistant" + } + }, + "llava_150k_zh": { + "hf_hub_url": "BUAADreamer/llava-en-zh-300k", + "subset": "zh", + "formatting": "sharegpt", + "columns": { + "messages": "messages", + "images": "images" + }, + "tags": { + "role_tag": "role", + "content_tag": "content", + "user_tag": "user", + "assistant_tag": "assistant" + } + }, "example": { "script_url": "example_dataset", "columns": {