From 0d7d0ea9727d325c5230cbd713780b518a52d87d Mon Sep 17 00:00:00 2001
From: Dhia Eddine Rhaiem <163106757+dhiaEddineRhaiem@users.noreply.github.com>
Date: Wed, 18 Jun 2025 12:51:23 +0400
Subject: [PATCH] [model] add support for Falcon H1 (#8403)

---
Review notes (free-form commentary placed after the three-dash line; not
part of the commit message and not part of any hunk):

* README.md: adds the Falcon-H1 row (0.5B/1.5B/3B/7B/34B, template
  `falcon_h1`) to the supported-models table.
* template.py: registers the `falcon_h1` template. Turns are wrapped in
  `<|im_start|>{role}\n ... <|im_end|>\n`; stop words are `<|im_end|>` and
  `<|end_of_text|>`; the prefix slot is the `{"bos_token"}` set.
* constants.py: registers twelve Falcon-H1 checkpoints (Base and Instruct for
  0.5B, 1.5B, 1.5B-Deep, 3B, 7B, 34B) bound to template `falcon_h1`. Every
  DEFAULT and MODELSCOPE repo id uses the `tiiuae/` organisation prefix.
* NOTE(review): `format_user` and `format_observation` end at `<|im_end|>\n`
  and do not append an `<|im_start|>assistant\n` header -- confirm this
  matches the Falcon-H1 tokenizer chat template.

 README.md                            |  1 +
 src/llamafactory/data/template.py    | 13 +++++++
 src/llamafactory/extras/constants.py | 55 ++++++++++++++++++++++++++++
 3 files changed, 69 insertions(+)

diff --git a/README.md b/README.md
index 490f8c0a..d86a5323 100644
--- a/README.md
+++ b/README.md
@@ -262,6 +262,7 @@ Choose your path:
 | [DeepSeek 2.5/3](https://huggingface.co/deepseek-ai) | 236B/671B | deepseek3 |
 | [DeepSeek R1 (Distill)](https://huggingface.co/deepseek-ai) | 1.5B/7B/8B/14B/32B/70B/671B | deepseekr1 |
 | [Falcon](https://huggingface.co/tiiuae) | 7B/11B/40B/180B | falcon |
+| [Falcon-H1](https://huggingface.co/tiiuae) | 0.5B/1.5B/3B/7B/34B | falcon_h1 |
 | [Gemma/Gemma 2/CodeGemma](https://huggingface.co/google) | 2B/7B/9B/27B | gemma |
 | [Gemma 3](https://huggingface.co/google) | 1B/4B/12B/27B | gemma3/gemma (1B) |
 | [GLM-4/GLM-4-0414/GLM-Z1](https://huggingface.co/THUDM) | 9B/32B | glm4/glmz1 |
diff --git a/src/llamafactory/data/template.py b/src/llamafactory/data/template.py
index ac19b30b..4a769662 100644
--- a/src/llamafactory/data/template.py
+++ b/src/llamafactory/data/template.py
@@ -916,6 +916,19 @@ register_template(
 )
 
 
+register_template(
+    name="falcon_h1",
+    format_user=StringFormatter(slots=["<|im_start|>user\n{{content}}<|im_end|>\n"]),
+    format_assistant=StringFormatter(slots=["{{content}}<|im_end|>\n"]),
+    format_system=StringFormatter(slots=["<|im_start|>system\n{{content}}<|im_end|>\n"]),
+    format_function=FunctionFormatter(slots=["{{content}}<|im_end|>\n"], tool_format="default"),
+    format_observation=StringFormatter(slots=["<|im_start|>tool\n{{content}}<|im_end|>\n"]),
+    format_tools=ToolFormatter(tool_format="default"),
+    format_prefix=EmptyFormatter(slots=[{"bos_token"}]),
+    stop_words=["<|im_end|>", "<|end_of_text|>"],
+)
+
+
 register_template(
     name="fewshot",
     format_assistant=StringFormatter(slots=["{{content}}\n\n"]),
diff --git a/src/llamafactory/extras/constants.py b/src/llamafactory/extras/constants.py
index f582d1f0..85c886c0 100644
--- a/src/llamafactory/extras/constants.py
+++ b/src/llamafactory/extras/constants.py
@@ -633,6 +633,61 @@ register_model_group(
     template="falcon",
 )
 
+register_model_group(
+    models={
+        "Falcon-H1-0.5B-Instruct": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-0.5B-Instruct",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-0.5B-Instruct",
+        },
+        "Falcon-H1-0.5B-Base": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-0.5B-Base",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-0.5B-Base",
+        },
+        "Falcon-H1-1.5B-Instruct": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-1.5B-Instruct",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-1.5B-Instruct",
+        },
+        "Falcon-H1-1.5B-Base": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-1.5B-Base",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-1.5B-Base",
+        },
+        "Falcon-H1-1.5B-Deep-Instruct": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-1.5B-Deep-Instruct",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-1.5B-Deep-Instruct",
+        },
+        "Falcon-H1-1.5B-Deep-Base": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-1.5B-Deep-Base",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-1.5B-Deep-Base",
+        },
+        "Falcon-H1-3B-Instruct": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-3B-Instruct",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-3B-Instruct",
+        },
+        "Falcon-H1-3B-Base": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-3B-Base",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-3B-Base",
+        },
+        "Falcon-H1-7B-Instruct": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-7B-Instruct",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-7B-Instruct",
+        },
+        "Falcon-H1-7B-Base": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-7B-Base",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-7B-Base",
+        },
+        "Falcon-H1-34B-Instruct": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-34B-Instruct",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-34B-Instruct",
+        },
+        "Falcon-H1-34B-Base": {
+            DownloadSource.DEFAULT: "tiiuae/Falcon-H1-34B-Base",
+            DownloadSource.MODELSCOPE: "tiiuae/Falcon-H1-34B-Base",
+        },
+
+    },
+    template="falcon_h1",
+)
+
 
 register_model_group(
     models={