mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-12-29 18:20:35 +08:00
[model] update kt code (#9406)
This commit is contained in:
@@ -485,7 +485,9 @@ class KTransformersArguments:
|
||||
)
|
||||
kt_optimize_rule: Optional[str] = field(
|
||||
default=None,
|
||||
metadata={"help": "Path To The KTransformers Optimize Rule; See https://github.com/kvcache-ai/ktransformers/."},
|
||||
metadata={
|
||||
"help": "Path To The KTransformers Optimize Rule; See https://github.com/kvcache-ai/ktransformers/."
|
||||
},
|
||||
)
|
||||
cpu_infer: Optional[int] = field(
|
||||
default=32,
|
||||
@@ -517,9 +519,16 @@ class KTransformersArguments:
|
||||
metadata={"help": "Force-Think Toggle For The KT Engine."},
|
||||
)
|
||||
|
||||
|
||||
@dataclass
|
||||
class ModelArguments(
|
||||
SGLangArguments, VllmArguments, KTransformersArguments, ExportArguments, ProcessorArguments, QuantizationArguments, BaseModelArguments
|
||||
SGLangArguments,
|
||||
VllmArguments,
|
||||
KTransformersArguments,
|
||||
ExportArguments,
|
||||
ProcessorArguments,
|
||||
QuantizationArguments,
|
||||
BaseModelArguments,
|
||||
):
|
||||
r"""Arguments pertaining to which model/config/tokenizer we are going to fine-tune or infer.
|
||||
|
||||
|
||||
Reference in New Issue
Block a user