mirror of
https://github.com/wassname/SimPO.git
synced 2026-06-27 18:21:59 +08:00
wip
This commit is contained in:
@@ -1,7 +1,7 @@
|
||||
|
||||
|
||||
|
||||
sft:
|
||||
llama-3-2-1b:
|
||||
. ./.venv/bin/activate
|
||||
|
||||
cp accelerate_configs/deepspeed_zero3.yaml alignment-handbook/recipes/accelerate_configs/deepspeed_zero3b.yaml
|
||||
@@ -12,37 +12,40 @@ sft:
|
||||
ACCELERATE_LOG_LEVEL=info accelerate launch --config_file recipes/accelerate_configs/deepspeed_zero3b.yaml --num_processes=1 scripts/run_sft.py recipes/llama-3-2-1b-base-sft.yaml
|
||||
|
||||
|
||||
b3:
|
||||
#!/bin/zsh
|
||||
. ./.venv/bin/activate
|
||||
# old:
|
||||
# #!/bin/zsh
|
||||
# . ./.venv/bin/activate
|
||||
|
||||
cp accelerate_configs/deepspeed_zero3.yaml alignment-handbook/recipes/accelerate_configs/deepspeed_zero3b.yaml
|
||||
cp training_configs/llama-3-2-3b-base-sft.yaml alignment-handbook/recipes/llama-3-2-3b-base-sft.yaml
|
||||
# cp accelerate_configs/deepspeed_zero3.yaml alignment-handbook/recipes/accelerate_configs/deepspeed_zero3b.yaml
|
||||
# cp training_configs/llama-3-2-3b-base-sft.yaml alignment-handbook/recipes/llama-3-2-3b-base-sft.yaml
|
||||
|
||||
# .venv/src/alignment-handbook/
|
||||
cd alignment-handbook
|
||||
ACCELERATE_LOG_LEVEL=info accelerate launch --config_file recipes/accelerate_configs/deepspeed_zero3b.yaml --num_processes=1 scripts/run_sft.py recipes/llama-3-2-3b-base-sft.yaml
|
||||
|
||||
# # .venv/src/alignment-handbook/
|
||||
# cd alignment-handbook
|
||||
# ACCELERATE_LOG_LEVEL=info accelerate launch --config_file recipes/accelerate_configs/deepspeed_zero3b.yaml --num_processes=1 scripts/run_sft.py recipes/llama-3-2-3b-base-sft.yaml
|
||||
|
||||
install:
|
||||
# install mambaforge
|
||||
wget bash https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge3-Linux-x86_64.sh
|
||||
bash Miniforge3-Linux-x86_64.sh -b -p /workspace/miniforge3
|
||||
/workspace/miniforge3/bin/conda init zsh
|
||||
source /root/.zshrc
|
||||
uv sync --no-build-isolation
|
||||
# uv add --no-build-isolation flash-attn
|
||||
|
||||
# git clone https://github.com/princeton-nlp/SimPO.git
|
||||
# install_old:
|
||||
# # install mambaforge
|
||||
# wget bash https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge3-Linux-x86_64.sh
|
||||
# bash Miniforge3-Linux-x86_64.sh -b -p /workspace/miniforge3
|
||||
# /workspace/miniforge3/bin/conda init zsh
|
||||
# source /root/.zshrc
|
||||
|
||||
# make env
|
||||
conda create -n handbook python=3.10
|
||||
conda activate handbook
|
||||
# install torch
|
||||
mamba install pytorch torchvision torchaudio pytorch-cuda=12.4 -c pytorch -c nvidia
|
||||
# # git clone https://github.com/princeton-nlp/SimPO.git
|
||||
|
||||
# install alignment handbook
|
||||
# or use .venv/src/alignment-handbook/
|
||||
git clone https://github.com/huggingface/alignment-handbook.git
|
||||
cd ./alignment-handbook/
|
||||
python -m pip install .
|
||||
python -m pip install flash-attn --no-build-isolation
|
||||
cd ..
|
||||
# # make env
|
||||
# conda create -n handbook python=3.10
|
||||
# conda activate handbook
|
||||
# # install torch
|
||||
# mamba install pytorch torchvision torchaudio pytorch-cuda=12.4 -c pytorch -c nvidia
|
||||
|
||||
# # install alignment handbook
|
||||
# # or use .venv/src/alignment-handbook/
|
||||
# git clone https://github.com/huggingface/alignment-handbook.git
|
||||
# cd ./alignment-handbook/
|
||||
# python -m pip install .
|
||||
# python -m pip install flash-attn --no-build-isolation
|
||||
# cd ..
|
||||
|
||||
Reference in New Issue
Block a user