support export push_to_hub #2183
This commit is contained in:
parent
a83fb6d3ff
commit
42859f0734
|
@ -106,6 +106,10 @@ class ModelArguments:
|
||||||
default=False,
|
default=False,
|
||||||
metadata={"help": "Whether or not to save the `.bin` files instead of `.safetensors`."}
|
metadata={"help": "Whether or not to save the `.bin` files instead of `.safetensors`."}
|
||||||
)
|
)
|
||||||
|
export_hub_model_id: Optional[str] = field(
|
||||||
|
default=None,
|
||||||
|
metadata={"help": "The name of the repository if push the model to the Hugging Face hub."}
|
||||||
|
)
|
||||||
|
|
||||||
def __post_init__(self):
|
def __post_init__(self):
|
||||||
self.compute_dtype = None
|
self.compute_dtype = None
|
||||||
|
|
|
@ -50,7 +50,7 @@ def export_model(args: Optional[Dict[str, Any]] = None):
|
||||||
if not isinstance(model, PreTrainedModel):
|
if not isinstance(model, PreTrainedModel):
|
||||||
raise ValueError("The model is not a `PreTrainedModel`, export aborted.")
|
raise ValueError("The model is not a `PreTrainedModel`, export aborted.")
|
||||||
|
|
||||||
model.config.use_cache = True
|
setattr(model.config, "use_cache", True)
|
||||||
if getattr(model.config, "torch_dtype", None) == "bfloat16":
|
if getattr(model.config, "torch_dtype", None) == "bfloat16":
|
||||||
model = model.to(torch.bfloat16).to("cpu")
|
model = model.to(torch.bfloat16).to("cpu")
|
||||||
else:
|
else:
|
||||||
|
@ -62,11 +62,20 @@ def export_model(args: Optional[Dict[str, Any]] = None):
|
||||||
max_shard_size="{}GB".format(model_args.export_size),
|
max_shard_size="{}GB".format(model_args.export_size),
|
||||||
safe_serialization=(not model_args.export_legacy_format)
|
safe_serialization=(not model_args.export_legacy_format)
|
||||||
)
|
)
|
||||||
|
if model_args.export_hub_model_id is not None:
|
||||||
|
model.push_to_hub(
|
||||||
|
model_args.export_hub_model_id,
|
||||||
|
token=model_args.hf_hub_token,
|
||||||
|
max_shard_size="{}GB".format(model_args.export_size),
|
||||||
|
safe_serialization=(not model_args.export_legacy_format)
|
||||||
|
)
|
||||||
|
|
||||||
try:
|
try:
|
||||||
tokenizer.padding_side = "left" # restore padding side
|
tokenizer.padding_side = "left" # restore padding side
|
||||||
tokenizer.init_kwargs["padding_side"] = "left"
|
tokenizer.init_kwargs["padding_side"] = "left"
|
||||||
tokenizer.save_pretrained(model_args.export_dir)
|
tokenizer.save_pretrained(model_args.export_dir)
|
||||||
|
if model_args.export_hub_model_id is not None:
|
||||||
|
tokenizer.push_to_hub(model_args.export_hub_model_id, token=model_args.hf_hub_token)
|
||||||
except:
|
except:
|
||||||
logger.warning("Cannot save tokenizer, please copy the files manually.")
|
logger.warning("Cannot save tokenizer, please copy the files manually.")
|
||||||
|
|
||||||
|
|
Loading…
Reference in New Issue