diff --git a/src/llamafactory/data/template.py b/src/llamafactory/data/template.py
index 818e5625..7e1204fd 100644
--- a/src/llamafactory/data/template.py
+++ b/src/llamafactory/data/template.py
@@ -558,7 +558,17 @@ _register_template(
     format_user=StringFormatter(slots=["<用户>{{content}}"]),
     format_prefix=EmptyFormatter(slots=[{"bos_token"}]),
 )
 
 
+# Prompt layout for the "cpm3" template: each turn is wrapped in <|im_start|>{role} ... <|im_end|>.
+_register_template(
+    name="cpm3",
+    format_user=StringFormatter(slots=["<|im_start|>user\n{{content}}<|im_end|>\n<|im_start|>assistant\n"]),
+    format_prefix=EmptyFormatter(slots=[{"bos_token"}]),
+    format_system=StringFormatter(slots=["<|im_start|>system\n{{content}}<|im_end|>\n"]),
+    stop_words=["<|im_end|>"],
+)
+
+
 _register_template(
     name="dbrx",
diff --git a/src/llamafactory/extras/constants.py b/src/llamafactory/extras/constants.py
index fc2d3460..91537877 100644
--- a/src/llamafactory/extras/constants.py
+++ b/src/llamafactory/extras/constants.py
@@ -806,6 +806,18 @@ register_model_group(
     template="cpm",
 )
 
 
+# MiniCPM3 checkpoints; prompts for this group are built with the "cpm3" template.
+register_model_group(
+    models={
+        "MiniCPM3-4B": {
+            DownloadSource.DEFAULT: "openbmb/MiniCPM3-4B",
+            DownloadSource.MODELSCOPE: "OpenBMB/MiniCPM3-4B",
+        },
+    },
+    template="cpm3",
+)
+
+
 register_model_group(
     models={