# Inference settings. Each setting sits on its own line so the file parses as
# a flat mapping with three independent keys.

# Model to load; presumably a hub repo id or a local path — confirm with the
# consuming tool.
model_name_or_path: Qwen/Qwen2-VL-7B-Instruct

# Template name; presumably must correspond to the model family above — verify
# against the consuming tool's list of templates.
template: qwen2_vl

# Backend used to run inference.
infer_backend: huggingface  # choices: [huggingface, vllm]