[script] fix vllm version (#7193)
Former-commit-id: 313355759dc906d3612364dc6c8f6344afdedb97
This commit is contained in: parent eba31ae313, commit b6c0e8608e
@@ -55,7 +55,7 @@ def vllm_infer(
     Performs batch generation using vLLM engine, which supports tensor parallelism.
 
     Usage: python vllm_infer.py --model_name_or_path meta-llama/Llama-2-7b-hf --template llama --dataset alpaca_en_demo
     """
-    check_version("vllm>=0.4.3,<=0.7.2")
+    check_version("vllm>=0.4.3,<=0.7.3")
     if pipeline_parallel_size > get_device_count():
         raise ValueError("Pipeline parallel size should be smaller than the number of gpus.")
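The change above raises the supported vLLM ceiling from 0.7.2 to 0.7.3. As a rough illustration of what a range check of this shape can do, here is a minimal sketch built on the standard packaging and importlib.metadata modules; it is an assumption about the behavior, not the check_version helper that LLaMA-Factory actually ships:

from importlib.metadata import version

from packaging.requirements import Requirement


def check_version(requirement: str) -> None:
    # Raise if the installed package does not satisfy the PEP 440 range.
    req = Requirement(requirement)  # e.g. "vllm>=0.4.3,<=0.7.3"
    installed = version(req.name)  # PackageNotFoundError if vllm is absent
    if installed not in req.specifier:
        raise RuntimeError(f"{req.name}=={installed} does not satisfy {requirement!r}")


check_version("vllm>=0.4.3,<=0.7.3")

Keeping an explicit upper bound makes the script fail fast on a vLLM release it has not been tested against, rather than breaking later inside generation.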
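The context lines also show the device guard that follows the version check. A minimal sketch of that guard, assuming get_device_count simply counts CUDA devices through torch (the repo's real helper may cover other accelerator backends):

import torch


def get_device_count() -> int:
    # Number of CUDA devices visible to this process (0 on CPU-only hosts).
    return torch.cuda.device_count() if torch.cuda.is_available() else 0


pipeline_parallel_size = 1  # hypothetical value, for illustration only
if pipeline_parallel_size > get_device_count():
    raise ValueError("Pipeline parallel size should be smaller than the number of gpus.")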