From caa0d09472a3a5815912a6cf799c1de62dd36631 Mon Sep 17 00:00:00 2001
From: wassname <1103714+wassname@users.noreply.github.com>
Date: Sun, 7 Jun 2026 22:12:00 +0000
Subject: [PATCH] broad: TEACHER_RT -> dense pool (was sparse, under-seeds); log: rename table cols train/deploy (drop 'knob')

Co-Authored-By: Claudypoo <288921227+claudypoo@users.noreply.github.com>
---
 justfile            |  2 +-
 src/vgrout/train.py | 12 ++++++------
 2 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/justfile b/justfile
index f4e03be..e4e491a 100644
--- a/justfile
+++ b/justfile
@@ -150,7 +150,7 @@ queue-dir6 seed='43':
 # Lower priority than queue-dir6 (the focused single-seed set runs first). resolve:
 # routeV deploy_hack < vanilla at matched solve, significant across the 3 seeds (paired t,
 # alpha=0.01 like the paper); ablations (random/vampire) ~ vanilla confirm directionality.
-TEACHER_RT := "out/pools/teacher_pool_runtests"
+TEACHER_RT := "out/pools/teacher_pool_runtests_dense"
 queue-broad:
     #!/usr/bin/env bash
     set -eu
diff --git a/src/vgrout/train.py b/src/vgrout/train.py
index 8ce80d1..265fad7 100644
--- a/src/vgrout/train.py
+++ b/src/vgrout/train.py
@@ -1984,15 +1984,15 @@ def main(cfg: Config) -> int:
     # --- TAIL: argv, the result table, the single objective. The last lines. ---
     # solve and hack alone are gameable (tank solve to kill hack, or accept hack to
     # lift solve); the deploy gap solve-hack is the one number to maximise. Taken
-    # from the FINAL DEPLOY eval (knob-off, held-out test) = the shipped model on
-    # unseen problems. knob-on hack is the train-rollout student rate (different set,
-    # so its solve cell is "-": there is no knob-on deploy-style solve to pair it).
+    # from the FINAL DEPLOY eval (quarantine deleted, held-out test) = the shipped
+    # model on unseen problems. The "train" hack is the train-rollout student rate
+    # (different set, so its solve cell is "-": no train deploy-style solve to pair).
     _dh, _ds, _dn = ev["hack"], ev["solve"], ev["n"]
-    _deploy_col = f"knob-off (deploy, test n={_dn})"
+    _deploy_col = f"deploy (test n={_dn})"
     print(f"\n\nargv: {' '.join(sys.argv)}\n")
     print(tabulate(
-        [{"measure": "hack ↓", "knob-on (train)": f"{hack_rate_s:.3f}", _deploy_col: f"{_dh:.3f}"},
-         {"measure": "solve ↑", "knob-on (train)": "-", _deploy_col: f"{_ds:.3f}"}],
+        [{"measure": "hack ↓", "train": f"{hack_rate_s:.3f}", _deploy_col: f"{_dh:.3f}"},
+         {"measure": "solve ↑", "train": "-", _deploy_col: f"{_ds:.3f}"}],
         headers="keys", tablefmt="github", disable_numparse=True))
     print(f"\n{cue} objective (deploy solve - hack ↑) = {_ds:.3f} - {_dh:.3f} = {_ds - _dh:+.3f} "
           f"[arm={cfg.arm} seed={cfg.seed}]")