mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-12-18 12:50:38 +08:00
[model] add qwen3vl 4b + 8b (#9275)
This commit is contained in:
@@ -3193,14 +3193,22 @@ register_model_group(
|
||||
|
||||
register_model_group(
|
||||
models={
|
||||
"Qwen3-VL-235B-A22B-Instruct": {
|
||||
DownloadSource.DEFAULT: "Qwen/Qwen3-VL-235B-A22B-Instruct",
|
||||
DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-235B-A22B-Instruct",
|
||||
"Qwen3-VL-4B-Instruct": {
|
||||
DownloadSource.DEFAULT: "Qwen/Qwen3-VL-4B-Instruct",
|
||||
DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-4B-Instruct",
|
||||
},
|
||||
"Qwen3-VL-8B-Instruct": {
|
||||
DownloadSource.DEFAULT: "Qwen/Qwen3-VL-8B-Instruct",
|
||||
DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-8B-Instruct",
|
||||
},
|
||||
"Qwen3-VL-30B-A3B-Instruct": {
|
||||
DownloadSource.DEFAULT: "Qwen/Qwen3-VL-30B-A3B-Instruct",
|
||||
DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-30B-A3B-Instruct",
|
||||
},
|
||||
"Qwen3-VL-235B-A22B-Instruct": {
|
||||
DownloadSource.DEFAULT: "Qwen/Qwen3-VL-235B-A22B-Instruct",
|
||||
DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-235B-A22B-Instruct",
|
||||
},
|
||||
},
|
||||
template="qwen3_vl_nothink",
|
||||
multimodal=True,
|
||||
@@ -3209,14 +3217,22 @@ register_model_group(
|
||||
|
||||
register_model_group(
|
||||
models={
|
||||
"Qwen3-VL-235B-A22B-Thinking": {
|
||||
DownloadSource.DEFAULT: "Qwen/Qwen3-VL-235B-A22B-Thinking",
|
||||
DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-235B-A22B-Thinking",
|
||||
"Qwen3-VL-4B-Thinking": {
|
||||
DownloadSource.DEFAULT: "Qwen/Qwen3-VL-4B-Thinking",
|
||||
DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-4B-Thinking",
|
||||
},
|
||||
"Qwen3-VL-8B-Thinking": {
|
||||
DownloadSource.DEFAULT: "Qwen/Qwen3-VL-8B-Thinking",
|
||||
DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-8B-Thinking",
|
||||
},
|
||||
"Qwen3-VL-30B-A3B-Thinking": {
|
||||
DownloadSource.DEFAULT: "Qwen/Qwen3-VL-30B-A3B-Thinking",
|
||||
DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-30B-A3B-Thinking",
|
||||
},
|
||||
"Qwen3-VL-235B-A22B-Thinking": {
|
||||
DownloadSource.DEFAULT: "Qwen/Qwen3-VL-235B-A22B-Thinking",
|
||||
DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-235B-A22B-Thinking",
|
||||
},
|
||||
},
|
||||
template="qwen3_vl",
|
||||
multimodal=True,
|
||||
|
||||
Reference in New Issue
Block a user