Files
SimPO/justfile
T
wassname 53af87561f bs
2024-09-30 12:56:06 +00:00

42 lines
1.9 KiB
Makefile

sft:
# ok so I gave up on getting sympo working, I just used the alignment handbook
# but hte potry is here
. ./.venv/bin/activate
# ACCELERATE_LOG_LEVEL=info accelerate launch --config_file accelerate_configs/deepspeed_zero3.yaml scripts/run_simpo.py training_configs/llama-3-2-1b-base-sft.yaml
# ACCELERATE_LOG_LEVEL=info accelerate launch --config_file recipes/accelerate_configs/deepspeed_zero3b.yaml --num_processes=1 scripts/run_sft.py recipes/llama-3-2-1b-base-sft.yaml
cp accelerate_configs/deepspeed_zero3.yaml alignment-handbook/recipes/accelerate_configs/deepspeed_zero3b.yaml
cp training_configs/llama-3-2-1b-base-sft.yaml alignment-handbook/recipes/llama-3-2-1b-base-sft.yaml
# .venv/src/alignment-handbook/
cd alignment-handbook
ACCELERATE_LOG_LEVEL=info accelerate launch --config_file recipes/accelerate_configs/deepspeed_zero3b.yaml --num_processes=1 scripts/run_sft.py recipes/llama-3-2-1b-base-sft.yaml
# ACCELERATE_LOG_LEVEL=info accelerate launch --config_file ../accelerate_configs/deepspeed_zero3.yaml --num_processes=1 scripts/run_sft.py ../training_configs/llama-3-2-1b-base-sft.yaml
install:
# install mambaforge
wget bash https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge3-Linux-x86_64.sh
bash Miniforge3-Linux-x86_64.sh -b -p /workspace/miniforge3
/workspace/miniforge3/bin/conda init zsh
source /root/.zshrc
# git clone https://github.com/princeton-nlp/SimPO.git
# make env
conda create -n handbook python=3.10
conda activate handbook
# install torch
mamba install pytorch torchvision torchaudio pytorch-cuda=12.4 -c pytorch -c nvidia
# install alignment handbook
# or use .venv/src/alignment-handbook/
git clone https://github.com/huggingface/alignment-handbook.git
cd ./alignment-handbook/
python -m pip install .
python -m pip install flash-attn --no-build-isolation
cd ..