mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-12-14 19:06:26 +08:00
@@ -107,7 +107,7 @@ class ModelArguments:
|
|||||||
)
|
)
|
||||||
vllm_maxlen: int = field(
|
vllm_maxlen: int = field(
|
||||||
default=2048,
|
default=2048,
|
||||||
metadata={"help": "Maximum input length of the vLLM engine."},
|
metadata={"help": "Maximum sequence length of the vLLM engine (including prompt and output)."},
|
||||||
)
|
)
|
||||||
vllm_gpu_util: float = field(
|
vllm_gpu_util: float = field(
|
||||||
default=0.9,
|
default=0.9,
|
||||||
|
|||||||
Reference in New Issue
Block a user