mirror of
https://github.com/wassname/SimPO.git
synced 2026-06-27 17:46:46 +08:00
49 lines
1.8 KiB
Makefile
49 lines
1.8 KiB
Makefile
|
|
|
|
|
|
# sft: run supervised fine-tuning with the Llama-3.2-1B base config.
#
# Copies the local DeepSpeed ZeRO-3 accelerate config and the 1B SFT training
# config into the alignment-handbook checkout, then launches
# scripts/run_sft.py from inside that checkout on a single process.
#
# All steps are chained with `&&` in ONE shell invocation: make runs every
# recipe line in a fresh shell, so the venv activation and the `cd` would
# otherwise be lost before `accelerate launch` runs.
#
# NOTE(review): the handbook checkout may alternatively live under
# .venv/src/alignment-handbook/ -- adjust the paths below if so.
.PHONY: sft
sft:
	. ./.venv/bin/activate && \
	cp accelerate_configs/deepspeed_zero3.yaml alignment-handbook/recipes/accelerate_configs/deepspeed_zero3b.yaml && \
	cp training_configs/llama-3-2-1b-base-sft.yaml alignment-handbook/recipes/llama-3-2-1b-base-sft.yaml && \
	cd alignment-handbook && \
	ACCELERATE_LOG_LEVEL=info accelerate launch --config_file recipes/accelerate_configs/deepspeed_zero3b.yaml --num_processes=1 scripts/run_sft.py recipes/llama-3-2-1b-base-sft.yaml
|
|
|
|
|
|
# b3: run supervised fine-tuning with the Llama-3.2-3B base config.
#
# Copies the local DeepSpeed ZeRO-3 accelerate config and the 3B SFT training
# config into the alignment-handbook checkout, then launches
# scripts/run_sft.py from inside that checkout on a single process.
#
# All steps are chained with `&&` in ONE shell invocation: make runs every
# recipe line in a fresh shell, so the venv activation and the `cd` would
# otherwise be lost before `accelerate launch` runs. A shebang inside a recipe
# has no effect (it is just a shell comment), so none is used here; set
# `SHELL` at the top of the Makefile if a specific shell is required.
#
# NOTE(review): the handbook checkout may alternatively live under
# .venv/src/alignment-handbook/ -- adjust the paths below if so.
.PHONY: b3
b3:
	. ./.venv/bin/activate && \
	cp accelerate_configs/deepspeed_zero3.yaml alignment-handbook/recipes/accelerate_configs/deepspeed_zero3b.yaml && \
	cp training_configs/llama-3-2-3b-base-sft.yaml alignment-handbook/recipes/llama-3-2-3b-base-sft.yaml && \
	cd alignment-handbook && \
	ACCELERATE_LOG_LEVEL=info accelerate launch --config_file recipes/accelerate_configs/deepspeed_zero3b.yaml --num_processes=1 scripts/run_sft.py recipes/llama-3-2-3b-base-sft.yaml
|
|
|
|
|
|
# install: bootstrap Miniforge, create the `handbook` conda environment, and
# install PyTorch (CUDA 12.4 build), alignment-handbook and flash-attn into it.
#
# Presumably run from the root of a SimPO checkout
# (git clone https://github.com/princeton-nlp/SimPO.git) -- TODO confirm.
#
# Override the Miniforge location with `make install MINIFORGE_PREFIX=/some/dir`.
MINIFORGE_PREFIX ?= /workspace/miniforge3

.PHONY: install
install:
# Download the Miniforge installer (-O pins the output name so re-runs
# overwrite instead of creating numbered copies) and install it in batch mode.
	wget -O Miniforge3-Linux-x86_64.sh https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge3-Linux-x86_64.sh
	bash Miniforge3-Linux-x86_64.sh -b -p $(MINIFORGE_PREFIX)
# Register conda with zsh for future interactive sessions. The recipe itself
# does not rely on this: make runs each line in a fresh /bin/sh, so sourcing
# ~/.zshrc here would neither work nor persist.
	$(MINIFORGE_PREFIX)/bin/conda init zsh
# Create the environment and install torch into it by name (-n) so no
# activation is needed; -y keeps the run non-interactive.
	$(MINIFORGE_PREFIX)/bin/conda create -y -n handbook python=3.10
	$(MINIFORGE_PREFIX)/bin/mamba install -y -n handbook pytorch torchvision torchaudio pytorch-cuda=12.4 -c pytorch -c nvidia
# Fetch alignment-handbook unless a checkout already exists
# (or use .venv/src/alignment-handbook/).
	[ -d alignment-handbook ] || git clone https://github.com/huggingface/alignment-handbook.git
# Activate the env and pip-install inside a single shell so that both the
# activation and the `cd` are still in effect when pip runs.
	. $(MINIFORGE_PREFIX)/etc/profile.d/conda.sh && \
	conda activate handbook && \
	cd ./alignment-handbook/ && \
	python -m pip install . && \
	python -m pip install flash-attn --no-build-isolation
|