mirror of
https://github.com/wassname/alignment-handbook.git
synced 2026-06-27 18:41:19 +08:00
Update Zephyr configs to account for UltraFeedback & TRL fixes (#88)
* Add files * Add checkpointing * Add checkpointing to SFT * Add loss type * Fix setup * Clean SFT * Add lora config * Rename config * Remove max eval samples * Add kwargs to push to hub * Add DPO configs * Fix dpo configs * Extend chat template test to multi-turn * Add warmup * Refactor * Fix LoRA -> QLoRA * Fix configs * Specify chat template * Add sample logging * Fix push to hub hanging * Add reentrant * Fix quality * Add transformer logging * Tweak grad acc * Add null type * Add doc
This commit is contained in:
@@ -50,21 +50,22 @@ _deps = [
|
||||
"evaluate==0.4.0",
|
||||
"flake8>=6.0.0",
|
||||
"hf-doc-builder>=0.4.0",
|
||||
"hf_transfer>=0.1.4",
|
||||
"huggingface-hub>=0.14.1,<1.0",
|
||||
"isort>=5.12.0",
|
||||
"ninja>=1.11.1",
|
||||
"numpy>=1.24.2",
|
||||
"packaging>=23.0",
|
||||
"parameterized>=0.9.0",
|
||||
"peft==0.6.1",
|
||||
"peft==0.7.1",
|
||||
"protobuf<=3.20.2", # Needed to avoid conflicts with `transformers`
|
||||
"pytest",
|
||||
"safetensors>=0.3.3",
|
||||
"scipy",
|
||||
"tensorboard",
|
||||
"torch==2.1.0",
|
||||
"transformers==4.35.0",
|
||||
"trl==0.7.4",
|
||||
"torch==2.1.2",
|
||||
"transformers==4.36.2",
|
||||
"trl==0.7.7",
|
||||
"jinja2>=3.0.0",
|
||||
"tqdm>=4.64.1",
|
||||
]
|
||||
|
||||
Reference in New Issue
Block a user