diff --git a/recipes/zephyr-7b-beta/sft/config_lora.yaml b/recipes/zephyr-7b-beta/sft/config_lora.yaml
index 286166a..f45c5fc 100644
--- a/recipes/zephyr-7b-beta/sft/config_lora.yaml
+++ b/recipes/zephyr-7b-beta/sft/config_lora.yaml
@@ -49,4 +49,5 @@ report_to:
 - tensorboard
 save_strategy: "no"
 save_total_limit: null
-seed: 42
\ No newline at end of file
+seed: 42
+warmup_ratio: 0.1