# wxcz_admin / project0802clean-llm-git


			
				
					
						
						
							1234567891011121314151617181920
							mlflow_project: sft-gsm8k
checkpoint_dir: ${hydra:run.dir}/checkpoint/
csv_dir: ${hydra:run.dir}/csv/  # for saving evaluation results

model_path: huggingface_models/Qwen/Qwen2.5-Math-1.5B
dataset_path: "data_sft/openai/gsm8k"

train_device: cuda:0
eval_device: cuda:1

micro_batch_size: 2
gradient_accumulation_steps: 4
eval_batch_size: 2
num_epochs: 1
learning_rate: 2e-5
weight_decay: 0.01
eval_steps: 1
save_steps: 10