[fix] correct ktransformers example config paths and templates (#9732)

This commit is contained in:
Peilin Li
2026-01-08 10:52:50 +08:00
committed by GitHub
parent 5cfd804b59
commit 03a70ba8dd
7 changed files with 12 additions and 12 deletions

View File

@@ -1,9 +1,9 @@
# Inference settings for DeepSeek-V3 (bf16) using the KTransformers backend.
# Each key appears exactly once: duplicate mapping keys are invalid YAML and
# are silently resolved "last wins" by most parsers.
model_name_or_path: opensourcerelease/DeepSeek-V3-bf16
template: deepseek3
infer_backend: ktransformers  # choices: [huggingface, vllm, sglang, ktransformers]
trust_remote_code: true
use_kt: true  # enable KTransformers (the LoRA SFT backend) for inference
# Path to the KTransformers optimize-rule file for this model.
# NOTE(review): presumably resolved relative to the repository root - confirm.
kt_optimize_rule: examples/ktransformers/kt_optimize_rules/DeepSeek-V3-Chat-sft-amx-multi-gpu.yaml
cpu_infer: 32
chunk_size: 8192