Update model_args.py

Former-commit-id: f1e018587e5722e41962abd60f74043a3e55f692
This commit is contained in:
Xu Song
2024-05-31 14:35:48 +08:00
committed by GitHub
parent 070b944895
commit f2ae2cc04d

View File

@@ -107,7 +107,7 @@ class ModelArguments:
)
vllm_maxlen: int = field(
default=2048,
-metadata={"help": "Maximum input length of the vLLM engine."},
+metadata={"help": "Maximum sequence length of the vLLM engine (including prompt and output)."},
)
vllm_gpu_util: float = field(
default=0.9,