Files
evil_MoE/pyproject.toml
T
wassname 42498682ca spec
2026-05-23 13:04:03 +08:00

50 lines
1.3 KiB
TOML

[project]
name = "projected_grpo"
version = "0.1.0"
description = "SVD-basis gradient projection vs RL reward hacking on Nanda's LeetCode benchmark"
requires-python = ">=3.11"
# Runtime requirements as PEP 508 strings, one per line, in alphabetical order.
dependencies = [
    "beartype>=0.18",
    "datasets>=3.0",
    "einops>=0.8",
    "huggingface_hub>=0.24",
    "jaxtyping>=0.2",
    "loguru>=0.7",
    "numpy<2.0",
    "peft>=0.13",
    "polars>=1.0",
    "tabulate>=0.9",
    "torch>=2.4",
    "tqdm>=4.66",
    # Qwen3.5 (model_type=qwen3_5, gated-delta-net) needs transformers>=4.58.
    # The HF model card says to install from main while 4.58 is unreleased, so
    # this specifier is only a lower bound; the real source is the git checkout
    # configured under [tool.uv.sources].
    "transformers>=4.58.0.dev0",
    "tyro>=0.8",
    "wandb>=0.18",
]

[project.optional-dependencies]
# Opt-in extra: requested as `projected_grpo[gpu]`.
gpu = ["vllm>=0.10"]

[tool.ruff.lint]
# jaxtyping shape strings trip F722, so that rule is switched off.
ignore = [
    "F722",
]

[build-system]
# Build through the setuptools backend; setuptools itself is the only
# build-time requirement.
build-backend = "setuptools.build_meta"
requires = [
    "setuptools>=68",
]

[tool.setuptools.packages.find]
# Package discovery is restricted to the src/ directory (src layout).
where = ["src"]
[tool.uv]
# Resolution cutoff: uv ignores distributions uploaded after this date.
# Per the uv docs, a bare date (no time or offset) is read in the system's
# configured time zone.
# NOTE(review): this presumably does not constrain the git-sourced
# transformers declared in [tool.uv.sources] -- confirm.
exclude-newer = "2026-05-23"
[tool.uv.sources]
# Qwen3.5 (qwen3_5 model_type, gated-delta-net) lands in transformers main; pin
# until 4.58 release. v5.7.0 changelog note: "incorrect cached forward behavior
# in Qwen3.5's gated-delta-net linear attention" — fixed on main.
# NOTE(review): "main" is a moving ref, so this tracks the branch rather than
# pinning a commit; installs are only reproducible through a committed lockfile.
# NOTE(review): the comments in this file cite both 4.58 and v5.7.0 as the
# relevant release -- confirm which one carries the fix before removing this
# override.
transformers = { git = "https://github.com/huggingface/transformers.git", rev = "main" }