diff --git a/README.md b/README.md index 7e3c0c895..d238101e6 100644 --- a/README.md +++ b/README.md @@ -336,6 +336,7 @@ Read technical notes: | [Skywork o1](https://huggingface.co/Skywork) | 8B | skywork_o1 | | [StarCoder 2](https://huggingface.co/bigcode) | 3B/7B/15B | - | | [TeleChat2](https://huggingface.co/Tele-AI) | 3B/7B/35B/115B | telechat2 | +| [VibeThinker-1.5B](https://huggingface.co/WeiboAI) | 1.5B | qwen3 | | [XVERSE](https://huggingface.co/xverse) | 7B/13B/65B | xverse | | [Yi/Yi-1.5 (Code)](https://huggingface.co/01-ai) | 1.5B/6B/9B/34B | yi | | [Yi-VL](https://huggingface.co/01-ai) | 6B/34B | yi_vl | diff --git a/README_zh.md b/README_zh.md index ba7ed90ba..50e805005 100644 --- a/README_zh.md +++ b/README_zh.md @@ -338,6 +338,7 @@ https://github.com/user-attachments/assets/43b700c6-a178-41db-b1f8-8190a5d3fcfc | [Skywork o1](https://huggingface.co/Skywork) | 8B | skywork_o1 | | [StarCoder 2](https://huggingface.co/bigcode) | 3B/7B/15B | - | | [TeleChat2](https://huggingface.co/Tele-AI) | 3B/7B/35B/115B | telechat2 | +| [VibeThinker-1.5B](https://huggingface.co/WeiboAI) | 1.5B | qwen3 | | [XVERSE](https://huggingface.co/xverse) | 7B/13B/65B | xverse | | [Yi/Yi-1.5 (Code)](https://huggingface.co/01-ai) | 1.5B/6B/9B/34B | yi | | [Yi-VL](https://huggingface.co/01-ai) | 6B/34B | yi_vl | diff --git a/src/llamafactory/extras/constants.py b/src/llamafactory/extras/constants.py index e0d4cbd90..aec67ca85 100644 --- a/src/llamafactory/extras/constants.py +++ b/src/llamafactory/extras/constants.py @@ -3520,6 +3520,17 @@ register_model_group( ) +register_model_group( + models={ + "VibeThinker-1.5B": { + DownloadSource.DEFAULT: "WeiboAI/VibeThinker-1.5B", + DownloadSource.MODELSCOPE: "WeiboAI/VibeThinker-1.5B", + }, + }, + template="qwen3", +) + + register_model_group( models={ "Vicuna-v1.5-7B-Chat": {