diff --git a/README.md b/README.md index 952b7b3..02e82fa 100644 --- a/README.md +++ b/README.md @@ -12,7 +12,7 @@ The Alignment Handbook aims to fill that gap by providing the community with a s ## News 🗞️ -* November 10, 2023: We release all the training code to replicate Zephyr 7B 🪁! +* November 10, 2023: We release all the training code to replicate Zephyr-7b-β 🪁! ## Links 🔗 diff --git a/recipes/zephyr-7b-beta/dpo/config_lora.yaml b/recipes/zephyr-7b-beta/dpo/config_lora.yaml index 38ac36a..6d04714 100644 --- a/recipes/zephyr-7b-beta/dpo/config_lora.yaml +++ b/recipes/zephyr-7b-beta/dpo/config_lora.yaml @@ -2,7 +2,7 @@ model_name_or_path: alignment-handbook/zephyr-7b-sft-lora torch_dtype: auto -# LORA +# LoRA arguments use_peft: true lora_r: 64 lora_alpha: 16 diff --git a/recipes/zephyr-7b-beta/sft/config_full.yaml b/recipes/zephyr-7b-beta/sft/config_full.yaml index d73c443..4d8d2d1 100644 --- a/recipes/zephyr-7b-beta/sft/config_full.yaml +++ b/recipes/zephyr-7b-beta/sft/config_full.yaml @@ -32,7 +32,7 @@ output_dir: data/zephyr-7b-sft-full overwrite_output_dir: true per_device_eval_batch_size: 16 per_device_train_batch_size: 32 -push_to_hub: True +push_to_hub: true remove_unused_columns: true report_to: - tensorboard diff --git a/recipes/zephyr-7b-beta/sft/config_lora.yaml b/recipes/zephyr-7b-beta/sft/config_lora.yaml index 3106a01..3eb2d0e 100644 --- a/recipes/zephyr-7b-beta/sft/config_lora.yaml +++ b/recipes/zephyr-7b-beta/sft/config_lora.yaml @@ -44,7 +44,7 @@ output_dir: data/zephyr-7b-sft-lora overwrite_output_dir: true per_device_eval_batch_size: 8 per_device_train_batch_size: 4 -push_to_hub: True +push_to_hub: true report_to: - tensorboard save_strategy: "no" diff --git a/scripts/README.md b/scripts/README.md index 6af993c..d3065e2 100644 --- a/scripts/README.md +++ b/scripts/README.md @@ -32,7 +32,7 @@ ACCELERATE_LOG_LEVEL=info accelerate launch --config_file recipes/accelerate_con ACCELERATE_LOG_LEVEL=info accelerate launch --config_file 
recipes/accelerate_configs/deepspeed_zero3.yaml scripts/run_dpo.py recipes/zephyr-7b-beta/dpo/config_full.yaml ``` -** 💡 Tip:** If you scale the up/down the number of GPUs, we recommend also scaling up the per-device batch size or number of gradient accumulation steps to keep the global batch size constant (and thus replicate our results). +**💡 Tip:** If you scale up/down the number of GPUs, we recommend also scaling the per-device batch size or number of gradient accumulation steps in the opposite direction to keep the global batch size constant (and thus replicate our results). By default, these scripts will push each model to your Hugging Face Hub username, i.e. `{username}/{model_name}-{task}`. You can override the parameters in each YAML config by appending them to the command as follows: diff --git a/tests/fixtures/config_sft_full.yaml b/tests/fixtures/config_sft_full.yaml index 81720e9..adf13da 100644 --- a/tests/fixtures/config_sft_full.yaml +++ b/tests/fixtures/config_sft_full.yaml @@ -32,7 +32,7 @@ output_dir: data/zephyr-7b-sft-full overwrite_output_dir: true per_device_eval_batch_size: 16 per_device_train_batch_size: 32 -push_to_hub: True +push_to_hub: true remove_unused_columns: true report_to: - tensorboard