Files
weight-steering/pyproject.toml
T
wassname 8ed3103e47 feat(authority): add authority behavior, logratio+SI metrics, prune dead code
- Add AUTHORITY_PROMPT + 3 persona pairs (MFT-paper framing, sl-identical)
- Wire authority into data._personas/_topics/_build_specs
- Add SINGLE_FOUNDATION + _axis_shift for single-foundation behaviors
- Add logratio to per-vignette/frame scoring (same convention as sl)
- Add _si.py: port si_per_foundation from sl foundations.py
- Drop prompt_baseline mode, repe, sycophancy, subspace, run_demo
- Strip kl_calibrate to dW-only; remove repe+prompt_texts deps
- Simplify replicate.py to train+diff only (no eval/demo/subspace)
- Default behavior="authority" across eval, sweep, replicate
- Install tinymfv git dep; flash_attn 2.6.3 prebuilt wheel

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-05-03 14:04:23 +08:00

47 lines
1.0 KiB
TOML

# Core package metadata (PEP 621).
[project]
name = "weight-steering"
version = "0.1.0"
description = "Fork of Anthropic's weight-steering: replicate, test SVD/subspace alignment, sweep PEFT adapter families."
requires-python = ">=3.11"
# Runtime requirements, one PEP 508 string per line.
dependencies = [
    "torch>=2.4",
    "transformers>=4.46",
    "peft>=0.13",  # DeLoRA, DoRA, init_lora_weights="pissa"
    "datasets>=3.0",
    "accelerate>=1.0",
    "einops>=0.8",
    "jaxtyping>=0.2",
    "beartype>=0.19",
    "loguru>=0.7",
    "polars>=1.10",
    "tabulate>=0.9",
    "wandb>=0.18",
    "tyro>=0.8",
    # Direct git references: neither URL names a tag or commit.
    # NOTE(review): consider pinning each to a revision for reproducible installs.
    "baukit @ git+https://github.com/davidbau/baukit.git",
    "tiny-mfv @ git+https://github.com/wassname/tinymfv",
]
# Extras that are only installed on request (e.g. the "dev" extra below).
[project.optional-dependencies]
dev = [
    "pytest>=8",
    "ipykernel>=6",
    "ruff>=0.7",
]
# Build backend declaration: hatchling is both the sole build requirement
# and the backend entry point used to build this project.
[build-system]
requires = ["hatchling"]
build-backend = "hatchling.build"
# Hatchling refuses direct references ("name @ git+https://...") in project
# metadata unless this flag is set; the git-based entries in
# [project].dependencies depend on it.
[tool.hatch.metadata]
allow-direct-references = true
# Package directory that goes into the wheel. Hatch's `packages` option
# collapses the path to its final component (presumably importable as `ws`).
[tool.hatch.build.targets.wheel]
packages = ["src/ws"]
# Ruff settings. target-version matches the requires-python floor (3.11)
# declared in [project].
[tool.ruff]
line-length = 100
target-version = "py311"
# Resolver cutoff: limits candidate distributions by upload time.
# NOTE(review): "5 days" is a relative duration rather than an RFC 3339
# timestamp; confirm the uv version in use accepts relative values.
[tool.uv]
exclude-newer = "5 days"