From 13fd43617ca4b05880527f6609f44c7ff04bbe93 Mon Sep 17 00:00:00 2001 From: Yaowei Zheng Date: Thu, 5 Jun 2025 23:23:15 +0800 Subject: [PATCH] [assets] update readme (#8303) --- README.md | 2 ++ README_zh.md | 2 ++ src/llamafactory/extras/constants.py | 26 +++++++++++++------------- 3 files changed, 17 insertions(+), 13 deletions(-) diff --git a/README.md b/README.md index 5516a1b7..85dc4768 100644 --- a/README.md +++ b/README.md @@ -493,6 +493,8 @@ Extra dependencies available: torch, torch-npu, metrics, deepspeed, liger-kernel docker run -it --rm --gpus=all --ipc=host hiyouga/llamafactory:latest ``` +This image is built on Ubuntu 22.04 (x86\_64), CUDA 12.4, Python 3.11, PyTorch 2.6.0, and Flash-attn 2.7.4. + Find the pre-built images: https://hub.docker.com/r/hiyouga/llamafactory/tags Please refer to [build docker](#build-docker) to build the image yourself. diff --git a/README_zh.md b/README_zh.md index abd2f503..b3edfdfe 100644 --- a/README_zh.md +++ b/README_zh.md @@ -495,6 +495,8 @@ pip install -e ".[torch,metrics]" --no-build-isolation docker run -it --rm --gpus=all --ipc=host hiyouga/llamafactory:latest ``` +该镜像基于 Ubuntu 22.04(x86\_64)、CUDA 12.4、Python 3.11、PyTorch 2.6.0 和 Flash-attn 2.7.4 构建。 + 查看全部镜像:https://hub.docker.com/r/hiyouga/llamafactory/tags 请参阅[构建 Docker](#构建-docker) 来重新构建镜像。 diff --git a/src/llamafactory/extras/constants.py b/src/llamafactory/extras/constants.py index 06e450c9..a9d5b7cd 100644 --- a/src/llamafactory/extras/constants.py +++ b/src/llamafactory/extras/constants.py @@ -513,7 +513,7 @@ register_model_group( register_model_group( models={ - "DeepSeek-V2-236B-0628-Chat": { + "DeepSeek-V2-0628-236B-Chat": { DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V2-Chat-0628", DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V2-Chat-0628", }, @@ -521,7 +521,7 @@ register_model_group( DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V2.5", DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V2.5", }, - "DeepSeek-V2.5-236B-1210-Chat": { + "DeepSeek-V2.5-1210-236B-Chat": { DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V2.5-1210", DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V2.5-1210", }, @@ -533,7 +533,7 @@ register_model_group( DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V3", DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V3", }, - "DeepSeek-V3-671B-0324-Chat": { + "DeepSeek-V3-0324-671B-Chat": { DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V3-0324", DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V3-0324", }, @@ -556,10 +556,6 @@ register_model_group( DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-Distill-Llama-8B", }, - "DeepSeek-R1-8B-0528-Distill": { - DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", - DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", - }, "DeepSeek-R1-14B-Distill": { DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", @@ -580,7 +576,11 @@ register_model_group( DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1", DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1", }, - "DeepSeek-R1-671B-0528-Chat": { + "DeepSeek-R1-0528-8B-Distill": { + DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B", + }, + "DeepSeek-R1-0528-671B-Chat": { DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-0528", DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-0528", }, @@ -756,15 +756,15 @@ register_model_group( DownloadSource.DEFAULT: "THUDM/glm-4-9b-chat-1m", DownloadSource.MODELSCOPE: "ZhipuAI/glm-4-9b-chat-1m", }, - "GLM-4-9B-0414-Chat": { + "GLM-4-0414-9B-Chat": { DownloadSource.DEFAULT: "THUDM/GLM-4-9B-0414", DownloadSource.MODELSCOPE: "ZhipuAI/GLM-4-9B-0414", }, - "GLM-4-32B-0414": { + "GLM-4-0414-32B-Base": { DownloadSource.DEFAULT: "THUDM/GLM-4-32B-Base-0414", DownloadSource.MODELSCOPE: "ZhipuAI/GLM-4-32B-Base-0414", }, - "GLM-4-32B-0414-Chat": { + "GLM-4-0414-32B-Chat": { DownloadSource.DEFAULT: "THUDM/GLM-4-32B-0414", DownloadSource.MODELSCOPE: "ZhipuAI/GLM-4-32B-0414", }, @@ -775,11 +775,11 @@ register_model_group( register_model_group( models={ - "GLM-Z1-9B-0414-Chat": { + "GLM-Z1-0414-9B-Chat": { DownloadSource.DEFAULT: "THUDM/GLM-Z1-9B-0414", DownloadSource.MODELSCOPE: "ZhipuAI/GLM-Z1-9B-0414", }, - "GLM-Z1-32B-0414-Chat": { + "GLM-Z1-0414-32B-Chat": { DownloadSource.DEFAULT: "THUDM/GLM-Z1-32B-0414", DownloadSource.MODELSCOPE: "ZhipuAI/GLM-Z1-32B-0414", },