[data] fix qwen omni plugin (#9204)

Co-authored-by: kingsley <kingsleydodonow@gmail.com>
2026-06-10 17:28:55 +08:00 · 2025-09-28 01:02:29 +08:00
parent 0761a4448f
commit 6ffebe5ff7
15 changed files with 292 additions and 210 deletions
--- a/src/llamafactory/extras/constants.py
+++ b/src/llamafactory/extras/constants.py
@@ -3060,13 +3060,14 @@ register_model_group(
    multimodal=True,
 )

+
 register_model_group(
    models={
-        "Qwen/Qwen3-Omni-30B-A3B-Captioner": {
+        "Qwen3-Omni-30B-A3B-Captioner": {
            DownloadSource.DEFAULT: "Qwen/Qwen3-Omni-30B-A3B-Captioner",
            DownloadSource.MODELSCOPE: "Qwen/Qwen3-Omni-30B-A3B-Captioner",
        },
-        "Qwen/Qwen3-Omni-30B-A3B-Instruct": {
+        "Qwen3-Omni-30B-A3B-Instruct": {
            DownloadSource.DEFAULT: "Qwen/Qwen3-Omni-30B-A3B-Instruct",
            DownloadSource.MODELSCOPE: "Qwen/Qwen3-Omni-30B-A3B-Instruct",
        },
@@ -3075,9 +3076,10 @@ register_model_group(
    multimodal=True,
 )

+
 register_model_group(
    models={
-        "Qwen/Qwen3-Omni-30B-A3B-Thinking": {
+        "Qwen3-Omni-30B-A3B-Thinking": {
            DownloadSource.DEFAULT: "Qwen/Qwen3-Omni-30B-A3B-Thinking",
            DownloadSource.MODELSCOPE: "Qwen/Qwen3-Omni-30B-A3B-Thinking",
        },
@@ -3086,6 +3088,7 @@ register_model_group(
    multimodal=True,
 )

+
 register_model_group(
    models={
        "Qwen2-VL-2B": {
@@ -3190,24 +3193,24 @@ register_model_group(

 register_model_group(
    models={
-        "Qwen/Qwen3-VL-235B-A22B-Thinking": {
-            DownloadSource.DEFAULT: "Qwen/Qwen3-VL-235B-A22B-Thinking",
-            DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-235B-A22B-Thinking",
+        "Qwen3-VL-235B-A22B-Instruct": {
+            DownloadSource.DEFAULT: "Qwen/Qwen3-VL-235B-A22B-Instruct",
+            DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-235B-A22B-Instruct",
        },
    },
-    template="qwen3_vl",
+    template="qwen3_vl_nothink",
    multimodal=True,
 )


 register_model_group(
    models={
-        "Qwen/Qwen3-VL-235B-A22B-Instruct": {
-            DownloadSource.DEFAULT: "Qwen/Qwen3-VL-235B-A22B-Instruct",
-            DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-235B-A22B-Instruct",
+        "Qwen3-VL-235B-A22B-Thinking": {
+            DownloadSource.DEFAULT: "Qwen/Qwen3-VL-235B-A22B-Thinking",
+            DownloadSource.MODELSCOPE: "Qwen/Qwen3-VL-235B-A22B-Thinking",
        },
    },
-    template="qwen3_vl_nothink",
+    template="qwen3_vl",
    multimodal=True,
 )

--- a/src/llamafactory/extras/misc.py
+++ b/src/llamafactory/extras/misc.py
@@ -94,7 +94,7 @@ def check_version(requirement: str, mandatory: bool = False) -> None:

 def check_dependencies() -> None:
    r"""Check the version of the required packages."""
-    check_version("transformers>=4.49.0,<=4.56.1")
+    check_version("transformers>=4.49.0,<=4.56.2")
    check_version("datasets>=2.16.0,<=4.0.0")
    check_version("accelerate>=1.3.0,<=1.10.1")
    check_version("peft>=0.14.0,<=0.17.1")