mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-07-31 10:42:50 +08:00
[assets] update readme (#8303)
This commit is contained in:
parent
fcd8662306
commit
13fd43617c
@ -493,6 +493,8 @@ Extra dependencies available: torch, torch-npu, metrics, deepspeed, liger-kernel
|
||||
docker run -it --rm --gpus=all --ipc=host hiyouga/llamafactory:latest
|
||||
```
|
||||
|
||||
This image is built on Ubuntu 22.04 (x86\_64), CUDA 12.4, Python 3.11, PyTorch 2.6.0, and Flash-attn 2.7.4.
|
||||
|
||||
Find the pre-built images: https://hub.docker.com/r/hiyouga/llamafactory/tags
|
||||
|
||||
Please refer to [build docker](#build-docker) to build the image yourself.
|
||||
|
@ -495,6 +495,8 @@ pip install -e ".[torch,metrics]" --no-build-isolation
|
||||
docker run -it --rm --gpus=all --ipc=host hiyouga/llamafactory:latest
|
||||
```
|
||||
|
||||
该镜像基于 Ubuntu 22.04(x86\_64)、CUDA 12.4、Python 3.11、PyTorch 2.6.0 和 Flash-attn 2.7.4 构建。
|
||||
|
||||
查看全部镜像:https://hub.docker.com/r/hiyouga/llamafactory/tags
|
||||
|
||||
请参阅[构建 Docker](#构建-docker) 来重新构建镜像。
|
||||
|
@ -513,7 +513,7 @@ register_model_group(
|
||||
|
||||
register_model_group(
|
||||
models={
|
||||
"DeepSeek-V2-236B-0628-Chat": {
|
||||
"DeepSeek-V2-0628-236B-Chat": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V2-Chat-0628",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V2-Chat-0628",
|
||||
},
|
||||
@ -521,7 +521,7 @@ register_model_group(
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V2.5",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V2.5",
|
||||
},
|
||||
"DeepSeek-V2.5-236B-1210-Chat": {
|
||||
"DeepSeek-V2.5-1210-236B-Chat": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V2.5-1210",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V2.5-1210",
|
||||
},
|
||||
@ -533,7 +533,7 @@ register_model_group(
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V3",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V3",
|
||||
},
|
||||
"DeepSeek-V3-671B-0324-Chat": {
|
||||
"DeepSeek-V3-0324-671B-Chat": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V3-0324",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V3-0324",
|
||||
},
|
||||
@ -556,10 +556,6 @@ register_model_group(
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-Distill-Llama-8B",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-Distill-Llama-8B",
|
||||
},
|
||||
"DeepSeek-R1-8B-0528-Distill": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
|
||||
},
|
||||
"DeepSeek-R1-14B-Distill": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",
|
||||
@ -580,7 +576,11 @@ register_model_group(
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1",
|
||||
},
|
||||
"DeepSeek-R1-671B-0528-Chat": {
|
||||
"DeepSeek-R1-0528-8B-Distill": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
|
||||
},
|
||||
"DeepSeek-R1-0528-671B-Chat": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-0528",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-0528",
|
||||
},
|
||||
@ -756,15 +756,15 @@ register_model_group(
|
||||
DownloadSource.DEFAULT: "THUDM/glm-4-9b-chat-1m",
|
||||
DownloadSource.MODELSCOPE: "ZhipuAI/glm-4-9b-chat-1m",
|
||||
},
|
||||
"GLM-4-9B-0414-Chat": {
|
||||
"GLM-4-0414-9B-Chat": {
|
||||
DownloadSource.DEFAULT: "THUDM/GLM-4-9B-0414",
|
||||
DownloadSource.MODELSCOPE: "ZhipuAI/GLM-4-9B-0414",
|
||||
},
|
||||
"GLM-4-32B-0414": {
|
||||
"GLM-4-0414-32B-Base": {
|
||||
DownloadSource.DEFAULT: "THUDM/GLM-4-32B-Base-0414",
|
||||
DownloadSource.MODELSCOPE: "ZhipuAI/GLM-4-32B-Base-0414",
|
||||
},
|
||||
"GLM-4-32B-0414-Chat": {
|
||||
"GLM-4-0414-32B-Chat": {
|
||||
DownloadSource.DEFAULT: "THUDM/GLM-4-32B-0414",
|
||||
DownloadSource.MODELSCOPE: "ZhipuAI/GLM-4-32B-0414",
|
||||
},
|
||||
@ -775,11 +775,11 @@ register_model_group(
|
||||
|
||||
register_model_group(
|
||||
models={
|
||||
"GLM-Z1-9B-0414-Chat": {
|
||||
"GLM-Z1-0414-9B-Chat": {
|
||||
DownloadSource.DEFAULT: "THUDM/GLM-Z1-9B-0414",
|
||||
DownloadSource.MODELSCOPE: "ZhipuAI/GLM-Z1-9B-0414",
|
||||
},
|
||||
"GLM-Z1-32B-0414-Chat": {
|
||||
"GLM-Z1-0414-32B-Chat": {
|
||||
DownloadSource.DEFAULT: "THUDM/GLM-Z1-32B-0414",
|
||||
DownloadSource.MODELSCOPE: "ZhipuAI/GLM-Z1-32B-0414",
|
||||
},
|
||||
|
Loading…
x
Reference in New Issue
Block a user