Add stage field to DatasetAttr
This commit is contained in:
parent
cece66d48a
commit
ba94c8729d
|
@@ -11,6 +11,7 @@ class DatasetAttr:
|
||||||
dataset_name: Optional[str] = None
|
dataset_name: Optional[str] = None
|
||||||
dataset_sha1: Optional[str] = None
|
dataset_sha1: Optional[str] = None
|
||||||
system_prompt: Optional[str] = None
|
system_prompt: Optional[str] = None
|
||||||
|
stage: Optional[str] = None
|
||||||
|
|
||||||
def __repr__(self) -> str:
|
def __repr__(self) -> str:
|
||||||
return self.dataset_name
|
return self.dataset_name
|
||||||
|
@@ -113,14 +114,21 @@ class DataArguments:
|
||||||
raise ValueError("Undefined dataset {} in dataset_info.json.".format(name))
|
raise ValueError("Undefined dataset {} in dataset_info.json.".format(name))
|
||||||
|
|
||||||
if "hf_hub_url" in dataset_info[name]:
|
if "hf_hub_url" in dataset_info[name]:
|
||||||
dataset_attr = DatasetAttr("hf_hub", dataset_name=dataset_info[name]["hf_hub_url"])
|
dataset_attr = DatasetAttr(
|
||||||
|
"hf_hub",
|
||||||
|
dataset_name=dataset_info[name]["hf_hub_url"],
|
||||||
|
stage=dataset_info[name].get("stage", None))
|
||||||
elif "script_url" in dataset_info[name]:
|
elif "script_url" in dataset_info[name]:
|
||||||
dataset_attr = DatasetAttr("script", dataset_name=dataset_info[name]["script_url"])
|
dataset_attr = DatasetAttr(
|
||||||
|
"script",
|
||||||
|
dataset_name=dataset_info[name]["script_url"],
|
||||||
|
stage=dataset_info[name].get("stage", None))
|
||||||
else:
|
else:
|
||||||
dataset_attr = DatasetAttr(
|
dataset_attr = DatasetAttr(
|
||||||
"file",
|
"file",
|
||||||
dataset_name=dataset_info[name]["file_name"],
|
dataset_name=dataset_info[name]["file_name"],
|
||||||
dataset_sha1=dataset_info[name].get("file_sha1", None)
|
dataset_sha1=dataset_info[name].get("file_sha1", None),
|
||||||
|
stage=dataset_info[name].get("stage", None)
|
||||||
)
|
)
|
||||||
|
|
||||||
if "columns" in dataset_info[name]:
|
if "columns" in dataset_info[name]:
|
||||||
|
|
Loading…
Reference in New Issue