mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-08-02 03:32:50 +08:00
update examples
Former-commit-id: fc7f1cc365ee481b76f9c7e6f1947b49cf131fbf
This commit is contained in:
parent
03c538ebb3
commit
86513f28dc
@ -3,7 +3,7 @@ We provide diverse examples about fine-tuning LLMs.
|
|||||||
```
|
```
|
||||||
examples/
|
examples/
|
||||||
├── lora_single_gpu/
|
├── lora_single_gpu/
|
||||||
│ ├── pt.sh: Do pre-training
|
│ ├── pretrain.sh: Do pre-training
|
||||||
│ ├── sft.sh: Do supervised fine-tuning
|
│ ├── sft.sh: Do supervised fine-tuning
|
||||||
│ ├── reward.sh: Do reward modeling
|
│ ├── reward.sh: Do reward modeling
|
||||||
│ ├── ppo.sh: Do PPO training
|
│ ├── ppo.sh: Do PPO training
|
||||||
|
@ -3,7 +3,7 @@
|
|||||||
```
|
```
|
||||||
examples/
|
examples/
|
||||||
├── lora_single_gpu/
|
├── lora_single_gpu/
|
||||||
│ ├── pt.sh: 进行预训练
|
│ ├── pretrain.sh: 进行预训练
|
||||||
│ ├── sft.sh: 进行指令监督微调
|
│ ├── sft.sh: 进行指令监督微调
|
||||||
│ ├── reward.sh: 进行奖励模型训练
|
│ ├── reward.sh: 进行奖励模型训练
|
||||||
│ ├── ppo.sh: 进行 PPO 训练
|
│ ├── ppo.sh: 进行 PPO 训练
|
||||||
|
@ -6,7 +6,7 @@ CUDA_VISIBLE_DEVICES=0 python ../../src/train_bash.py \
|
|||||||
--model_name_or_path meta-llama/Llama-2-7b-hf \
|
--model_name_or_path meta-llama/Llama-2-7b-hf \
|
||||||
--adapter_name_or_path ../../saves/LLaMA2-7B/lora/sft \
|
--adapter_name_or_path ../../saves/LLaMA2-7B/lora/sft \
|
||||||
--create_new_adapter \
|
--create_new_adapter \
|
||||||
--dataset comparison_gpt4_en \
|
--dataset orca_rlhf \
|
||||||
--dataset_dir ../../data \
|
--dataset_dir ../../data \
|
||||||
--template default \
|
--template default \
|
||||||
--finetuning_type lora \
|
--finetuning_type lora \
|
||||||
|
@ -6,7 +6,7 @@ CUDA_VISIBLE_DEVICES=0 python ../../src/train_bash.py \
|
|||||||
--model_name_or_path meta-llama/Llama-2-7b-hf \
|
--model_name_or_path meta-llama/Llama-2-7b-hf \
|
||||||
--adapter_name_or_path ../../saves/LLaMA2-7B/lora/sft \
|
--adapter_name_or_path ../../saves/LLaMA2-7B/lora/sft \
|
||||||
--create_new_adapter \
|
--create_new_adapter \
|
||||||
--dataset comparison_gpt4_en \
|
--dataset orca_rlhf \
|
||||||
--dataset_dir ../../data \
|
--dataset_dir ../../data \
|
||||||
--template default \
|
--template default \
|
||||||
--finetuning_type lora \
|
--finetuning_type lora \
|
||||||
|
Loading…
x
Reference in New Issue
Block a user