Mirror of https://github.com/hiyouga/LLaMA-Factory.git (synced 2026-01-10 08:00:36 +08:00)
[release] Bye 2025 (#9702)
This commit is contained in:
22
examples/train_lora/qwen3_preprocess.yaml
Normal file
22
examples/train_lora/qwen3_preprocess.yaml
Normal file
@@ -0,0 +1,22 @@
### model
model_name_or_path: Qwen/Qwen3-4B-Instruct-2507
trust_remote_code: true

### method
stage: sft
do_train: true
finetuning_type: lora
lora_rank: 8
lora_target: all

### dataset
dataset: identity,alpaca_en_demo
template: qwen3_nothink
cutoff_len: 2048
max_samples: 1000
preprocessing_num_workers: 16
tokenized_path: saves/qwen3-4b/dataset/sft

### output (not used)
output_dir: saves/qwen3-4b/lora/sft
overwrite_output_dir: true
||||
Reference in New Issue
Block a user