From 9e4fda326d9c5392b4ce7169768f52b46bdbb59c Mon Sep 17 00:00:00 2001 From: codingma Date: Sun, 7 Apr 2024 11:34:01 +0800 Subject: [PATCH 1/4] support Breeze-7B models and template (https://github.com/hiyouga/LLaMA-Factory/issues/3152) Former-commit-id: 708f0ab4b0aa72e2c73ca36eb9ed058910e43092 --- src/llmtuner/data/template.py | 9 +++++++++ src/llmtuner/extras/constants.py | 14 ++++++++++++++ 2 files changed, 23 insertions(+) diff --git a/src/llmtuner/data/template.py b/src/llmtuner/data/template.py index 6cc12c56..440030db 100644 --- a/src/llmtuner/data/template.py +++ b/src/llmtuner/data/template.py @@ -773,3 +773,12 @@ _register_template( format_user=StringFormatter(slots=[":{{content}}\n:"]), format_separator=EmptyFormatter(slots=["\n"]), ) + +_register_template( + name="mediatek", + format_user=StringFormatter(slots=["[INST] {{content}} [/INST] "]), + format_system=StringFormatter(slots=[{"bos_token"}, "{{content}}"]), + default_system="You are a helpful AI assistant built by MediaTek Research. The user you are helping speaks Traditional Chinese and comes from Taiwan. 
", + force_system=True, + efficient_eos=True, +) \ No newline at end of file diff --git a/src/llmtuner/extras/constants.py b/src/llmtuner/extras/constants.py index 6e46218b..535c7cdb 100644 --- a/src/llmtuner/extras/constants.py +++ b/src/llmtuner/extras/constants.py @@ -969,3 +969,17 @@ register_model_group( }, template="atom", ) + +register_model_group( + models={ + "Breeze-7B": { + DownloadSource.DEFAULT: "MediaTek-Research/Breeze-7B-Base-v1_0", + DownloadSource.MODELSCOPE: "MediaTek-Research/Breeze-7B-Base-v1_0", + }, + "Breeze-7B-Chat": { + DownloadSource.DEFAULT: "MediaTek-Research/Breeze-7B-Instruct-v1_0", + DownloadSource.MODELSCOPE: "MediaTek-Research/Breeze-7B-Instruct-v1_0", + } + }, + template="mediatek", +) \ No newline at end of file From 75866aa0207d131e45eb736201c1fd971536e81b Mon Sep 17 00:00:00 2001 From: codingma Date: Sun, 7 Apr 2024 11:39:54 +0800 Subject: [PATCH 2/4] rename template to breeze Former-commit-id: 1d894e7cfb73b8a29dababb554d051bd50e4f01d --- src/llmtuner/data/template.py | 2 +- src/llmtuner/extras/constants.py | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/src/llmtuner/data/template.py b/src/llmtuner/data/template.py index 440030db..bd9e65e9 100644 --- a/src/llmtuner/data/template.py +++ b/src/llmtuner/data/template.py @@ -775,7 +775,7 @@ _register_template( ) _register_template( - name="mediatek", + name="breeze", format_user=StringFormatter(slots=["[INST] {{content}} [/INST] "]), format_system=StringFormatter(slots=[{"bos_token"}, "{{content}}"]), default_system="You are a helpful AI assistant built by MediaTek Research. The user you are helping speaks Traditional Chinese and comes from Taiwan. 
", diff --git a/src/llmtuner/extras/constants.py b/src/llmtuner/extras/constants.py index 535c7cdb..b2ee3058 100644 --- a/src/llmtuner/extras/constants.py +++ b/src/llmtuner/extras/constants.py @@ -981,5 +981,5 @@ register_model_group( DownloadSource.MODELSCOPE: "MediaTek-Research/Breeze-7B-Instruct-v1_0", } }, - template="mediatek", + template="breeze", ) \ No newline at end of file From 1a8a8b8651e30b141daf015cfc1c597712e60272 Mon Sep 17 00:00:00 2001 From: codingma Date: Sun, 7 Apr 2024 18:27:20 +0800 Subject: [PATCH 3/4] remove force_system from breeze template and add newline at end of file Former-commit-id: 1223e6358dab52b4e1505057f1b16fd9d527c79e --- src/llmtuner/data/template.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/src/llmtuner/data/template.py b/src/llmtuner/data/template.py index bd9e65e9..88d7cb86 100644 --- a/src/llmtuner/data/template.py +++ b/src/llmtuner/data/template.py @@ -779,6 +779,5 @@ _register_template( format_user=StringFormatter(slots=["[INST] {{content}} [/INST] "]), format_system=StringFormatter(slots=[{"bos_token"}, "{{content}}"]), default_system="You are a helpful AI assistant built by MediaTek Research. The user you are helping speaks Traditional Chinese and comes from Taiwan. ", - force_system=True, efficient_eos=True, -) \ No newline at end of file +) From 325dafcbb0daee72c436b066edfc0e28c9f03a25 Mon Sep 17 00:00:00 2001 From: codingma Date: Sun, 7 Apr 2024 18:28:08 +0800 Subject: [PATCH 4/4] add newline at end of file Former-commit-id: 1c6c2e611d10e9fa662e3f4e1e7d23b80ae496cb --- src/llmtuner/extras/constants.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/llmtuner/extras/constants.py b/src/llmtuner/extras/constants.py index b2ee3058..34f89324 100644 --- a/src/llmtuner/extras/constants.py +++ b/src/llmtuner/extras/constants.py @@ -982,4 +982,4 @@ register_model_group( } }, template="breeze", -) \ No newline at end of file +)