Add a "mediatek" chat template and register the Breeze-7B model group.

src/llmtuner/data/template.py
    Registers a template named "mediatek". User turns are formatted as
    "[INST] {{content}} [/INST] ", the system slots are a {"bos_token"} set
    literal followed by "{{content}}", a default system prompt is supplied,
    and force_system and efficient_eos are both set to True.

src/llmtuner/extras/constants.py
    Registers the "Breeze-7B" and "Breeze-7B-Chat" entries, each with a
    DEFAULT and a MODELSCOPE download source, bound to template="mediatek".

Review notes:
  * The trailing space inside default_system is reproduced exactly as
    submitted; presumably intentional prompt spacing, confirm before merging.
  * Both MODELSCOPE ids repeat the DEFAULT ids verbatim; verify that these
    repositories actually exist on ModelScope.
  * Relative to the patch as submitted, both files now end with a newline
    and the "Breeze-7B-Chat" entry carries a trailing comma. The post-image
    blob ids on the "index" lines therefore no longer match and should be
    regenerated when the change is committed.
  * Leading indentation was reconstructed as 4-space Python indentation;
    check the context lines against the target files if the patch is
    rejected.

diff --git a/src/llmtuner/data/template.py b/src/llmtuner/data/template.py
index 6cc12c56..440030db 100644
--- a/src/llmtuner/data/template.py
+++ b/src/llmtuner/data/template.py
@@ -773,3 +773,12 @@ _register_template(
     format_user=StringFormatter(slots=[":{{content}}\n:"]),
     format_separator=EmptyFormatter(slots=["\n"]),
 )
+
+_register_template(
+    name="mediatek",
+    format_user=StringFormatter(slots=["[INST] {{content}} [/INST] "]),
+    format_system=StringFormatter(slots=[{"bos_token"}, "{{content}}"]),
+    default_system="You are a helpful AI assistant built by MediaTek Research. The user you are helping speaks Traditional Chinese and comes from Taiwan. ",
+    force_system=True,
+    efficient_eos=True,
+)
diff --git a/src/llmtuner/extras/constants.py b/src/llmtuner/extras/constants.py
index 6e46218b..535c7cdb 100644
--- a/src/llmtuner/extras/constants.py
+++ b/src/llmtuner/extras/constants.py
@@ -969,3 +969,17 @@ register_model_group(
     },
     template="atom",
 )
+
+register_model_group(
+    models={
+        "Breeze-7B": {
+            DownloadSource.DEFAULT: "MediaTek-Research/Breeze-7B-Base-v1_0",
+            DownloadSource.MODELSCOPE: "MediaTek-Research/Breeze-7B-Base-v1_0",
+        },
+        "Breeze-7B-Chat": {
+            DownloadSource.DEFAULT: "MediaTek-Research/Breeze-7B-Instruct-v1_0",
+            DownloadSource.MODELSCOPE: "MediaTek-Research/Breeze-7B-Instruct-v1_0",
+        },
+    },
+    template="mediatek",
+)