mirror of
https://github.com/wassname/evil_MoE.git
synced 2026-06-27 16:45:42 +08:00
cleanup: consolidate stale loaders and pair scripts
This commit is contained in:
@@ -357,6 +357,7 @@ extract-vhack-smoke:
|
||||
uv run python -m vgrout.extract_vhack_grad \
|
||||
--model=Qwen/Qwen3.5-0.8B \
|
||||
--dtype=bf16 \
|
||||
--pairs-from-pool=out/pairsets/prog_wide.json \
|
||||
--out-path=out/vhack/v_hack_smoke.safetensors \
|
||||
--train-grads-path=out/vhack_grads/vhack_grads_train_smoke.safetensors
|
||||
|
||||
@@ -364,6 +365,7 @@ extract-vhack-full:
|
||||
uv run python -m vgrout.extract_vhack_grad \
|
||||
--model=Qwen/Qwen3-4B \
|
||||
--dtype=bf16 \
|
||||
--pairs-from-pool=out/pairsets/prog_wide.json \
|
||||
--out-path=out/vhack/v_hack_full.safetensors \
|
||||
--train-grads-path=out/vhack_grads/vhack_grads_train_full.safetensors
|
||||
|
||||
@@ -371,6 +373,7 @@ verify-vhack-smoke:
|
||||
uv run python scripts/verify_vhack_heldout.py \
|
||||
--model=Qwen/Qwen3.5-0.8B \
|
||||
--dtype=bf16 \
|
||||
--pairs-path=out/pairsets/prog_wide.json \
|
||||
--v-hack-path=out/vhack/v_hack_smoke.safetensors \
|
||||
--out-path=out/vhack_heldout_cos_smoke.safetensors
|
||||
|
||||
@@ -378,6 +381,7 @@ verify-vhack-full:
|
||||
uv run python scripts/verify_vhack_heldout.py \
|
||||
--model=Qwen/Qwen3-4B \
|
||||
--dtype=bf16 \
|
||||
--pairs-path=out/pairsets/prog_wide.json \
|
||||
--v-hack-path=out/vhack/v_hack_full.safetensors \
|
||||
--out-path=out/vhack_heldout_cos_full.safetensors
|
||||
|
||||
|
||||
Reference in New Issue
Block a user