support export size setting

Former-commit-id: 1a4de54586c21cdbbc89f8a716ca5a54c87a6120
This commit is contained in:
hiyouga
2023-11-26 18:34:09 +08:00
parent 953a562ec1
commit 569860d7ac
4 changed files with 11 additions and 5 deletions

View File

@@ -34,7 +34,7 @@ def run_exp(args: Optional[Dict[str, Any]] = None, callbacks: Optional[List["Tra
raise ValueError("Unknown task.")
def export_model(args: Optional[Dict[str, Any]] = None, max_shard_size: Optional[str] = "10GB"):
def export_model(args: Optional[Dict[str, Any]] = None):
model_args, _, finetuning_args, _ = get_infer_args(args)
model, tokenizer = load_model_and_tokenizer(model_args, finetuning_args)
@@ -42,7 +42,7 @@ def export_model(args: Optional[Dict[str, Any]] = None, max_shard_size: Optional
raise ValueError("Cannot export a GPTQ quantized model.")
model.config.use_cache = True
model.save_pretrained(finetuning_args.export_dir, max_shard_size=max_shard_size)
model.save_pretrained(finetuning_args.export_dir, max_shard_size="{}GB".format(finetuning_args.export_size))
try:
tokenizer.padding_side = "left" # restore padding side