Former-commit-id: 8608fa268cde5cddf8d0c6c2eb2cb5fa246c1831
This commit is contained in:
@@ -107,7 +107,7 @@ class ModelArguments:
|
||||
)
|
||||
vllm_maxlen: int = field(
|
||||
default=2048,
|
||||
metadata={"help": "Maximum sequence length of the vLLM engine (including prompt and output)."},
|
||||
metadata={"help": "Maximum sequence (prompt + response) length of the vLLM engine."},
|
||||
)
|
||||
vllm_gpu_util: float = field(
|
||||
default=0.9,
|
||||
|
||||
Reference in New Issue
Block a user