Support batch inference in vLLM

Former-commit-id: 1324d158f9
This commit is contained in:
hiyouga
2024-12-04 13:50:00 +00:00
parent b2c67a989a
commit 235cdcacee
29 changed files with 148 additions and 407 deletions

View File

@@ -1,2 +1,3 @@
model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
template: llama3
infer_backend: huggingface # choices: [huggingface, vllm]

View File

@@ -2,3 +2,4 @@ model_name_or_path: meta-llama/Meta-Llama-3-8B-Instruct
adapter_name_or_path: saves/llama3-8b/lora/sft
template: llama3
finetuning_type: lora
infer_backend: huggingface # choices: [huggingface, vllm]

View File

@@ -1,2 +1,3 @@
model_name_or_path: llava-hf/llava-1.5-7b-hf
template: llava
infer_backend: huggingface # choices: [huggingface, vllm]

View File

@@ -1,2 +1,3 @@
model_name_or_path: Qwen/Qwen2-VL-7B-Instruct
template: qwen2_vl
infer_backend: huggingface # choices: [huggingface, vllm]