Files
SimPO/justfile
T
wassname 934a2ffb5d wip
2025-06-02 05:26:08 +00:00

52 lines
1.9 KiB
Makefile

# Stage the SFT configs into alignment-handbook and launch scripts/run_sft.py with accelerate (1 process).
llama-3-2-1b:
    #!/usr/bin/env bash
    # Shebang recipe: the whole body runs as ONE script. Without the shebang,
    # just runs every line in a fresh shell, so the venv activation and the
    # `cd` below would not carry over to the `accelerate launch` line.
    set -eu
    # Put the project virtualenv's tools on PATH for the rest of the script.
    . ./.venv/bin/activate
    # Copy the local accelerate and training configs into the handbook's recipes tree
    # (the destination directories are assumed to exist already).
    cp accelerate_configs/deepspeed_zero3.yaml alignment-handbook/recipes/accelerate_configs/deepspeed_zero3b.yaml
    cp training_configs/llama-3-2-1b-base-sft.yaml alignment-handbook/recipes/llama-3-2-1b-base-sft.yaml
    # .venv/src/alignment-handbook/
    # The launch command uses paths relative to the alignment-handbook checkout.
    cd alignment-handbook
    ACCELERATE_LOG_LEVEL=info accelerate launch --config_file recipes/accelerate_configs/deepspeed_zero3b.yaml --num_processes=1 scripts/run_sft.py recipes/llama-3-2-1b-base-sft.yaml
# old:
# #!/bin/zsh
# . ./.venv/bin/activate
# cp accelerate_configs/deepspeed_zero3.yaml alignment-handbook/recipes/accelerate_configs/deepspeed_zero3b.yaml
# cp training_configs/llama-3-2-3b-base-sft.yaml alignment-handbook/recipes/llama-3-2-3b-base-sft.yaml
# # .venv/src/alignment-handbook/
# cd alignment-handbook
# ACCELERATE_LOG_LEVEL=info accelerate launch --config_file recipes/accelerate_configs/deepspeed_zero3b.yaml --num_processes=1 scripts/run_sft.py recipes/llama-3-2-3b-base-sft.yaml
# Install the project's dependencies with `uv sync`, with build isolation turned off.
install:
    uv sync --no-build-isolation
    # uv add --no-build-isolation flash-attn
# install_old:
# # install mambaforge
# wget https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge3-Linux-x86_64.sh
# bash Miniforge3-Linux-x86_64.sh -b -p /workspace/miniforge3
# /workspace/miniforge3/bin/conda init zsh
# source /root/.zshrc
# # git clone https://github.com/princeton-nlp/SimPO.git
# # make env
# conda create -n handbook python=3.10
# conda activate handbook
# # install torch
# mamba install pytorch torchvision torchaudio pytorch-cuda=12.4 -c pytorch -c nvidia
# # install alignment handbook
# # or use .venv/src/alignment-handbook/
# git clone https://github.com/huggingface/alignment-handbook.git
# cd ./alignment-handbook/
# python -m pip install .
# python -m pip install flash-attn --no-build-isolation
# cd ..