diff --git a/src/llamafactory/data/template.py b/src/llamafactory/data/template.py index 7e1204fd..a0ebeff1 100644 --- a/src/llamafactory/data/template.py +++ b/src/llamafactory/data/template.py @@ -558,6 +558,8 @@ _register_template( format_user=StringFormatter(slots=["<用户>{{content}}"]), format_prefix=EmptyFormatter(slots=[{"bos_token"}]), ) + + _register_template( name="cpm3", format_user=StringFormatter(slots=["<|im_start|>user\n{{content}}<|im_end|>\n<|im_start|>assistant\n"]), @@ -566,6 +568,7 @@ _register_template( stop_words=["<|im_end|>"], ) + _register_template( name="dbrx", format_user=StringFormatter(slots=["<|im_start|>user\n{{content}}<|im_end|>\n<|im_start|>assistant\n"]), diff --git a/src/llamafactory/extras/constants.py b/src/llamafactory/extras/constants.py index 91537877..eadd0973 100644 --- a/src/llamafactory/extras/constants.py +++ b/src/llamafactory/extras/constants.py @@ -806,6 +806,7 @@ register_model_group( template="cpm", ) + register_model_group( models={ "MiniCPM3-4B": { @@ -816,6 +817,7 @@ register_model_group( template="cpm3", ) + register_model_group( models={ "Mistral-7B-v0.1": {