Former-commit-id: 416f6333f66b6afd70a3a936d82593efca583235
This commit is contained in:
hiyouga
2024-03-07 16:15:53 +08:00
parent 3de642bffd
commit 9a69cadab3
4 changed files with 41 additions and 30 deletions

View File

@@ -286,9 +286,9 @@ def patch_config(
init_kwargs["torch_dtype"] = model_args.compute_dtype
if not is_deepspeed_zero3_enabled():
init_kwargs["low_cpu_mem_usage"] = True
if "device_map" not in init_kwargs:
init_kwargs["device_map"] = {"": get_current_device()} if is_trainable else "auto"
init_kwargs["low_cpu_mem_usage"] = model_args.low_cpu_mem_usage
if "device_map" not in init_kwargs: # quant models cannot use auto device map
init_kwargs["device_map"] = model_args.device_map or {"": get_current_device()}
def patch_model(