[release] Bye 2025 (#9702)

2026-03-04 02:35:59 +08:00 · 2025-12-31 22:22:40 +08:00
parent 000526908a
commit 95ac3f2373
59 changed files with 154 additions and 401 deletions
--- a/examples/train_lora/qwen3_preprocess.yaml
+++ b/examples/train_lora/qwen3_preprocess.yaml
@@ -0,0 +1,22 @@
+### model (base checkpoint for this Qwen3 LoRA preprocessing example)
+model_name_or_path: Qwen/Qwen3-4B-Instruct-2507  # org/name id; presumably a hub repo id or local path
+trust_remote_code: true  # NOTE(review): presumably permits repo-supplied loading code; confirm it is needed
+
+### method
+stage: sft  # presumably supervised fine-tuning; confirm against the consumer's stage list
+do_train: true
+finetuning_type: lora
+lora_rank: 8
+lora_target: all  # presumably targets every eligible module; TODO confirm
+
+### dataset
+dataset: identity,alpaca_en_demo  # two comma-separated dataset names
+template: qwen3_nothink  # presumably must match the model family chosen above; verify
+cutoff_len: 2048  # presumably the per-sample token limit; TODO confirm
+max_samples: 1000  # presumably caps the samples used; TODO confirm scope (per dataset vs. total)
+preprocessing_num_workers: 16  # worker count for preprocessing; size to the available CPU cores
+tokenized_path: saves/qwen3-4b/dataset/sft  # presumably where the tokenized dataset is stored; TODO confirm
+
+### output (not used)
+output_dir: saves/qwen3-4b/lora/sft  # header marks this section unused; presumably still required by the parser
+overwrite_output_dir: true