Raise max_steps from 30 to 50 and num_train_epochs from 1 to 3 in the
`training` section of configs/training_config.yaml.

NOTE(review): the leading whitespace inside the hunk below was reconstructed
as two-space nesting under `training:`, and one blank context line was
restored to match the 10-line hunk counts. Verify against the target file
before applying (or apply with whitespace-tolerant options).

NOTE(review): the key names look like Hugging Face TrainingArguments; confirm
the consumer. If so, a positive max_steps overrides num_train_epochs, so the
epoch bump may have no effect, and a non-zero warmup_steps overrides
warmup_ratio. Confirm which of each pair is intended.

diff --git a/configs/training_config.yaml b/configs/training_config.yaml
index 0bd1316..7602927 100644
--- a/configs/training_config.yaml
+++ b/configs/training_config.yaml
@@ -13,10 +13,10 @@ training:
   # Memory-optimized batch size for RTX3070 8GB
   per_device_train_batch_size: 1
   gradient_accumulation_steps: 16
-  max_steps: 30
+  max_steps: 50
 
   # Training parameters
-  num_train_epochs: 1
+  num_train_epochs: 3
   learning_rate: 2.0e-4
   warmup_steps: 10
   warmup_ratio: 0.1