From 80aa1f70b66fe0b674f73de9d49ca1bd4a73fb9c Mon Sep 17 00:00:00 2001 From: codingma Date: Sun, 7 Apr 2024 11:34:01 +0800 Subject: [PATCH 1/4] support https://github.com/hiyouga/LLaMA-Factory/issues/3152 Former-commit-id: 2565a32bd98ef46a3b6e1a5c334093ca46b820d2 --- src/llmtuner/data/template.py | 9 +++++++++ src/llmtuner/extras/constants.py | 14 ++++++++++++++ 2 files changed, 23 insertions(+) diff --git a/src/llmtuner/data/template.py b/src/llmtuner/data/template.py index 6cc12c56..440030db 100644 --- a/src/llmtuner/data/template.py +++ b/src/llmtuner/data/template.py @@ -773,3 +773,12 @@ _register_template( format_user=StringFormatter(slots=[":{{content}}\n:"]), format_separator=EmptyFormatter(slots=["\n"]), ) + +_register_template( + name="mediatek", + format_user=StringFormatter(slots=["[INST] {{content}} [/INST] "]), + format_system=StringFormatter(slots=[{"bos_token"}, "{{content}}"]), + default_system="You are a helpful AI assistant built by MediaTek Research. The user you are helping speaks Traditional Chinese and comes from Taiwan. ", + force_system=True, + efficient_eos=True, +) \ No newline at end of file diff --git a/src/llmtuner/extras/constants.py b/src/llmtuner/extras/constants.py index 6e46218b..535c7cdb 100644 --- a/src/llmtuner/extras/constants.py +++ b/src/llmtuner/extras/constants.py @@ -969,3 +969,17 @@ register_model_group( }, template="atom", ) + +register_model_group( + models={ + "Breeze-7B": { + DownloadSource.DEFAULT: "MediaTek-Research/Breeze-7B-Base-v1_0", + DownloadSource.MODELSCOPE: "MediaTek-Research/Breeze-7B-Base-v1_0", + }, + "Breeze-7B-Chat": { + DownloadSource.DEFAULT: "MediaTek-Research/Breeze-7B-Instruct-v1_0", + DownloadSource.MODELSCOPE: "MediaTek-Research/Breeze-7B-Instruct-v1_0", + } + }, + template="mediatek", +) \ No newline at end of file From ed14f8bae753872cf9744d592f070265b25823b6 Mon Sep 17 00:00:00 2001 From: codingma Date: Sun, 7 Apr 2024 11:39:54 +0800 Subject: [PATCH 2/4] rename template to breeze Former-commit-id: 5a780e9eec7e8c560d417c1a95afa1be0f878d32 --- src/llmtuner/data/template.py | 2 +- src/llmtuner/extras/constants.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/src/llmtuner/data/template.py b/src/llmtuner/data/template.py index 440030db..bd9e65e9 100644 --- a/src/llmtuner/data/template.py +++ b/src/llmtuner/data/template.py @@ -775,7 +775,7 @@ _register_template( ) _register_template( - name="mediatek", + name="breeze", format_user=StringFormatter(slots=["[INST] {{content}} [/INST] "]), format_system=StringFormatter(slots=[{"bos_token"}, "{{content}}"]), default_system="You are a helpful AI assistant built by MediaTek Research. The user you are helping speaks Traditional Chinese and comes from Taiwan. ", diff --git a/src/llmtuner/extras/constants.py b/src/llmtuner/extras/constants.py index 535c7cdb..b2ee3058 100644 --- a/src/llmtuner/extras/constants.py +++ b/src/llmtuner/extras/constants.py @@ -981,5 +981,5 @@ register_model_group( DownloadSource.MODELSCOPE: "MediaTek-Research/Breeze-7B-Instruct-v1_0", } }, - template="mediatek", + template="breeze", ) \ No newline at end of file From fecab4d3f197f1231d3f6e50531a5e26a0029967 Mon Sep 17 00:00:00 2001 From: codingma Date: Sun, 7 Apr 2024 18:27:20 +0800 Subject: [PATCH 3/4] rename template to breeze Former-commit-id: 34bdcba0176a1612ab10351e59927ea744c6749c --- src/llmtuner/data/template.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/src/llmtuner/data/template.py b/src/llmtuner/data/template.py index bd9e65e9..88d7cb86 100644 --- a/src/llmtuner/data/template.py +++ b/src/llmtuner/data/template.py @@ -779,6 +779,5 @@ _register_template( format_user=StringFormatter(slots=["[INST] {{content}} [/INST] "]), format_system=StringFormatter(slots=[{"bos_token"}, "{{content}}"]), default_system="You are a helpful AI assistant built by MediaTek Research. The user you are helping speaks Traditional Chinese and comes from Taiwan. ", - force_system=True, efficient_eos=True, -) \ No newline at end of file +) From b5f0ac4c3fd65008c02f0da110ca747094ddcb33 Mon Sep 17 00:00:00 2001 From: codingma Date: Sun, 7 Apr 2024 18:28:08 +0800 Subject: [PATCH 4/4] add empty line Former-commit-id: 7b76b4ca08066af0465f138fa756615cbaef32ad --- src/llmtuner/extras/constants.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/llmtuner/extras/constants.py b/src/llmtuner/extras/constants.py index b2ee3058..34f89324 100644 --- a/src/llmtuner/extras/constants.py +++ b/src/llmtuner/extras/constants.py @@ -982,4 +982,4 @@ register_model_group( } }, template="breeze", -) \ No newline at end of file +)