diff --git a/scripts/results.py b/scripts/results.py
index 5213582..83a57b7 100644
--- a/scripts/results.py
+++ b/scripts/results.py
@@ -79,6 +79,13 @@ def parse_log(path: Path) -> dict | None:
     if not hs:
         return None
     cfg = _cfg(argv, preset_line)
+    # GROUND TRUTH mix: train.py prints `mix_ratio=<x>` in the pool INFO line
+    # (what the run actually used). Many runs rely on the preset default and
+    # pass no --mix-ratio flag, so the argv-based grab in _cfg defaults to the
+    # wrong value (0.5) and mis-keys them. Override with the printed value.
+    m_mix = re.search(r"mix_ratio=([\d.]+)", txt)
+    if m_mix:
+        cfg["mix"] = m_mix.group(1)
     if "tiny-random" in cfg["model"] or cfg["preset"] == "smoke":
         return None  # CPU smoke runs, not real results
     if "probe" in cfg["tag"]: