mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-12-14 19:06:26 +08:00
@@ -131,6 +131,9 @@ def calculate_mfu(
|
||||
"dataset": "c4_demo",
|
||||
"cutoff_len": seq_length,
|
||||
"output_dir": os.path.join("saves", "test_mfu"),
|
||||
"logging_strategy": "no",
|
||||
"save_strategy": "no",
|
||||
"save_only_model": True,
|
||||
"overwrite_output_dir": True,
|
||||
"per_device_train_batch_size": batch_size,
|
||||
"max_steps": num_steps,
|
||||
|
||||
Reference in New Issue
Block a user