diff --git a/scripts/results.py b/scripts/results.py index 5213582..83a57b7 100644 --- a/scripts/results.py +++ b/scripts/results.py @@ -79,6 +79,13 @@ def parse_log(path: Path) -> dict | None: if not hs: return None cfg = _cfg(argv, preset_line) + # GROUND TRUTH mix: train.py prints `mix_ratio=` in the pool INFO line + # (what the run actually used). Many runs rely on the preset default and + # pass no --mix-ratio flag, so the argv-based grab in _cfg defaults to the + # wrong value (0.5) and mis-keys them. Override with the printed value. + m_mix = re.search(r"mix_ratio=([\d.]+)", txt) + if m_mix: + cfg["mix"] = m_mix.group(1) if "tiny-random" in cfg["model"] or cfg["preset"] == "smoke": return None # CPU smoke runs, not real results if "probe" in cfg["tag"]: