From 80220a63eed0be37500aafd5aa8ca2e1c7e7d4cc Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Wed, 27 May 2026 13:56:23 +0200
Subject: [PATCH 01/15] Add interface meta_score module

Introduces a transparent, rank-style metascore that converts each of the
10 selected AlphaJudge interface features (LIS, ipSAE, pDockQ2, ipTM,
confidence, average interface PAE, pDockQ/mpDockQ, shape complementarity,
interface area, solvation energy) to its percentile against the frozen
benchmark_26 reference distribution and averages them. PAE and solvation
energy are sign-flipped so that higher percentile always means stronger
interaction evidence, and missing or non-finite inputs are ignored.

Reference deciles are baked into BENCHMARK_QUANTILES so the score is
reproducible and independent of any per-call benchmark file. Helper
calibrated_feature_percentile() can also be called directly to obtain the
percentile for an individual feature.

The scoring runner now writes interface_meta_score alongside the existing
columns in interfaces.csv, so every per-run output has a single ranking
number ready for downstream sorting or reporting.

Tests in test/test_meta_score.py cover bounded output, NaN handling,
direction of inverted features, and clamping at the unit interval.
---
 src/alphajudge/meta_score.py | 240 +++++++++++++++++++++++++++++++++++
 src/alphajudge/runner.py     |  13 +-
 test/test_meta_score.py      |  58 +++++++++
 3 files changed, 305 insertions(+), 6 deletions(-)
 create mode 100644 src/alphajudge/meta_score.py
 create mode 100644 test/test_meta_score.py

diff --git a/src/alphajudge/meta_score.py b/src/alphajudge/meta_score.py
new file mode 100644
index 00000000..89ed1284
--- /dev/null
+++ b/src/alphajudge/meta_score.py
@@ -0,0 +1,240 @@
+from __future__ import annotations
+
+import math
+from bisect import bisect_right
+from collections.abc import Mapping
+from typing import Any
+
+META_SCORE_FEATURES = (
+    "interface_LIS",
+    "interface_ipSAE",
+    "interface_pDockQ2",
+    "iptm",
+    "confidence_score",
+    "average_interface_pae",
+    "pDockQ/mpDockQ",
+    "interface_sc",
+    "interface_area",
+    "interface_solv_en",
+)
+
+FEATURE_DIRECTIONS = {
+    "interface_LIS": 1.0,
+    "interface_ipSAE": 1.0,
+    "interface_pDockQ2": 1.0,
+    "iptm": 1.0,
+    "confidence_score": 1.0,
+    "average_interface_pae": -1.0,
+    "pDockQ/mpDockQ": 1.0,
+    "interface_sc": 1.0,
+    "interface_area": 1.0,
+    "interface_solv_en": -1.0,
+}
+
+CALIBRATION_LEVELS = (
+    0.0,
+    0.1,
+    0.2,
+    0.3,
+    0.4,
+    0.5,
+    0.6,
+    0.7,
+    0.8,
+    0.9,
+    1.0,
+)
+
+# Frozen deciles from the benchmark_26 all-organism best-interface run
+# (7,345 AF2/AF3 positive/negative rows; April 22, 2026 merged table).
+# Values are already oriented so larger is better; e.g. PAE and solvation
+# energy are stored after sign flip.
+BENCHMARK_QUANTILES = {
+    "interface_LIS": (
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.059720202020202,
+        0.16705226076310281,
+        0.29334500115446349,
+        0.40119327202506005,
+        0.51623890758784829,
+        0.75338038596492163,
+    ),
+    "interface_ipSAE": (
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0,
+        0.0131470059312316,
+        0.10584161048830307,
+        0.43384587935260738,
+        0.64412107036419464,
+        0.77087459523243229,
+        0.95559878883735405,
+    ),
+    "interface_pDockQ2": (
+        0.0075494887493505998,
+        0.0089492092351328,
+        0.0093933511858568398,
+        0.0098769987230639799,
+        0.010703449712070559,
+        0.0124802347229461,
+        0.018771163348387087,
+        0.050761707493646967,
+        0.17282606942497017,
+        0.47580370600410854,
+        0.95042261592369204,
+    ),
+    "iptm": (
+        0.040000000000000001,
+        0.14999999999999999,
+        0.17999999999999999,
+        0.21093810200691221,
+        0.25285084247589107,
+        0.31,
+        0.40999999999999998,
+        0.53254582881927492,
+        0.67266757488250806,
+        0.81000000000000005,
+        0.97108757495880116,
+    ),
+    "confidence_score": (
+        0.12678638003217149,
+        0.23979955960633545,
+        0.28000000000000003,
+        0.32000000000000001,
+        0.37,
+        0.42999999999999999,
+        0.51000000000000001,
+        0.61354833086340177,
+        0.73788607560146302,
+        0.84101645584207918,
+        1.1499999999999999,
+    ),
+    "average_interface_pae": (
+        -31.5,
+        -27.859964220839984,
+        -26.073899561846982,
+        -24.438900954877365,
+        -22.36344086021505,
+        -20.006129032258062,
+        -16.573059698130209,
+        -11.591519818964887,
+        -6.7923660714285621,
+        -3.6440909090909086,
+        -1.0446969696969697,
+    ),
+    "pDockQ/mpDockQ": (
+        0.018258893561979499,
+        0.048401733659705799,
+        0.080583999776873999,
+        0.11763635331753999,
+        0.1609442064816457,
+        0.21622604840653531,
+        0.28893407672657195,
+        0.39005367493568538,
+        0.502151558453238,
+        0.62055885656958631,
+        0.74034050365479986,
+    ),
+    "interface_sc": (
+        -0.20978600009076619,
+        0.19474781603546867,
+        0.25907145776977002,
+        0.32226136048686279,
+        0.38997362215252516,
+        0.42865133273885592,
+        0.46107348285381024,
+        0.49758078915313065,
+        0.54187397531551566,
+        0.59373881458964451,
+        0.74402412409164909,
+    ),
+    "interface_area": (
+        12.696379714313343,
+        581.59180907251502,
+        830.76128351670551,
+        1067.0180525575927,
+        1311.9445584680248,
+        1586.0792814579392,
+        1912.6781164897349,
+        2333.6612364858556,
+        2898.2619149565764,
+        3914.9127720160723,
+        23847.404872232858,
+    ),
+    "interface_solv_en": (
+        -26.140681977743796,
+        0.38162628724614497,
+        3.1598266879255246,
+        5.8459112057851663,
+        8.5967875314312085,
+        11.475426312687474,
+        15.228084355320659,
+        20.067672952580592,
+        27.302842021122294,
+        39.330244540335536,
+        400.66271273444442,
+    ),
+}
+
+
+def _safe_float(value: Any) -> float:
+    try:
+        parsed = float(value)
+    except (TypeError, ValueError):
+        return float("nan")
+    return parsed if math.isfinite(parsed) else float("nan")
+
+
+def calibrated_feature_percentile(feature: str, value: Any) -> float | None:
+    """Map a raw feature value onto the frozen benchmark percentile scale."""
+    if feature not in BENCHMARK_QUANTILES:
+        raise KeyError(f"unknown metascore feature: {feature}")
+
+    raw = _safe_float(value)
+    if math.isnan(raw):
+        return None
+
+    oriented = raw * FEATURE_DIRECTIONS[feature]
+    quantiles = BENCHMARK_QUANTILES[feature]
+    levels = CALIBRATION_LEVELS
+
+    if oriented <= quantiles[0]:
+        return levels[0]
+    if oriented >= quantiles[-1]:
+        return levels[-1]
+
+    lower_idx = bisect_right(quantiles, oriented) - 1
+    lower_idx = max(0, min(lower_idx, len(quantiles) - 2))
+    q0 = quantiles[lower_idx]
+    q1 = quantiles[lower_idx + 1]
+    p0 = levels[lower_idx]
+    p1 = levels[lower_idx + 1]
+
+    if oriented == q0 or q1 <= q0:
+        return p0
+    fraction = (oriented - q0) / (q1 - q0)
+    return p0 + fraction * (p1 - p0)
+
+
+def interface_meta_score(row: Mapping[str, Any]) -> float:
+    """
+    Transparent rank-style interface metascore.
+
+    Each selected AlphaJudge feature is converted to a frozen benchmark
+    percentile where higher means stronger interaction evidence. Missing or
+    non-finite inputs are ignored. The final score is the mean percentile.
+    """
+    percentiles = [
+        percentile
+        for feature in META_SCORE_FEATURES
+        if (percentile := calibrated_feature_percentile(feature, row.get(feature))) is not None
+    ]
+    if not percentiles:
+        return float("nan")
+    return float(sum(percentiles) / len(percentiles))
diff --git a/src/alphajudge/runner.py b/src/alphajudge/runner.py
index 9f75ba2f..a94f5af4 100644
--- a/src/alphajudge/runner.py
+++ b/src/alphajudge/runner.py
@@ -14,6 +14,7 @@
 
 from .parsers import pick_parser
 from .complex import Complex
+from .meta_score import interface_meta_score
 
 logger = logging.getLogger(__name__)
 
@@ -101,8 +102,7 @@ def process(
                     f"{iface.chain1[0].get_parent().id}_{iface.chain2[0].get_parent().id}"
                 )
                 iptm_val = iface.iptm_chainpair if iface.iptm_chainpair is not None else confidence.iptm
-                
-                row_data = {
+                row = {
                     "jobs": job,
                     "model_used": m,
                     "interface": label,
@@ -129,10 +129,10 @@ def process(
                     "interface_ipSAE": iface.ipsae(),
                     "interface_LIS": iface.lis(),
                 }
-                
+
                 # Add expensive metrics only if not skipped
                 if not skip_biophysical_scores:
-                    row_data.update({
+                    row.update({
                         "interface_hb": iface.hb,
                         "interface_sb": iface.sb,
                         "interface_ss": iface.ss,
@@ -140,8 +140,9 @@ def process(
                         "interface_area": iface.int_area,
                         "interface_solv_en": iface.int_solv_en,
                     })
-                
-                rows.append(row_data)
+
+                row["interface_meta_score"] = interface_meta_score(row)
+                rows.append(row)
 
             # Compute chain boundaries for separator lines on PAE heatmap
             chain_boundaries: list[float] = []
diff --git a/test/test_meta_score.py b/test/test_meta_score.py
new file mode 100644
index 00000000..e47809f8
--- /dev/null
+++ b/test/test_meta_score.py
@@ -0,0 +1,58 @@
+from __future__ import annotations
+
+import math
+
+from alphajudge.meta_score import (
+    META_SCORE_FEATURES,
+    calibrated_feature_percentile,
+    interface_meta_score,
+)
+
+
+def _complete_row() -> dict[str, float]:
+    return {
+        "interface_LIS": 0.30,
+        "interface_ipSAE": 0.45,
+        "interface_pDockQ2": 0.06,
+        "iptm": 0.55,
+        "confidence_score": 0.62,
+        "average_interface_pae": 10.0,
+        "pDockQ/mpDockQ": 0.40,
+        "interface_sc": 0.50,
+        "interface_area": 2300.0,
+        "interface_solv_en": -32.0,
+    }
+
+
+def test_meta_score_is_bounded_for_complete_row() -> None:
+    score = interface_meta_score(_complete_row())
+
+    assert 0.0 <= score <= 1.0
+
+
+def test_meta_score_ignores_missing_or_nan_inputs() -> None:
+    row = {feature: float("nan") for feature in META_SCORE_FEATURES}
+    row["interface_LIS"] = 0.30
+
+    assert interface_meta_score(row) == calibrated_feature_percentile("interface_LIS", 0.30)
+
+
+def test_meta_score_returns_nan_when_all_inputs_missing() -> None:
+    assert math.isnan(interface_meta_score({}))
+
+
+def test_inverted_features_score_in_the_expected_direction() -> None:
+    low_pae = calibrated_feature_percentile("average_interface_pae", 4.0)
+    high_pae = calibrated_feature_percentile("average_interface_pae", 30.0)
+    strong_solvation = calibrated_feature_percentile("interface_solv_en", -50.0)
+    weak_solvation = calibrated_feature_percentile("interface_solv_en", -5.0)
+
+    assert low_pae is not None and high_pae is not None
+    assert strong_solvation is not None and weak_solvation is not None
+    assert low_pae > high_pae
+    assert strong_solvation > weak_solvation
+
+
+def test_feature_percentiles_clamp_to_unit_interval() -> None:
+    assert calibrated_feature_percentile("interface_LIS", -1.0) == 0.0
+    assert calibrated_feature_percentile("interface_LIS", 10.0) == 1.0

From 12f944084b984cb88ef36e7bd68cc581cfa27e0c Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Wed, 27 May 2026 13:56:47 +0200
Subject: [PATCH 02/15] Add RCSB-style validation report module

Generates PDF reports that visualise each AlphaJudge interface metric as a
percentile slider against the frozen benchmark_26 reference deciles,
mirroring the wwPDB "Overall quality at a glance" layout: smooth red ->
yellow -> green gradient bars with a single black marker, serif
typography, page header rule with title/entry id, and a "Continued on
next page" footer.

Public API:
  - generate_per_run_report(run_dir) writes report.pdf next to
    interfaces.csv with a cover, an overall slider panel, a per-interface
    table, the PAE heatmap, and one per-model appendix page per non-best
    sample.
  - generate_aggregate_report(summary_csv) writes a multi-page PDF with a
    cohort cover (meta-score histogram, summary statistics, top-N table)
    plus one slider page per complex, ranked by interface_meta_score.
  - main_aggregate() exposes both modes through the alphajudge-report CLI
    (wired in a follow-up commit).

Tests cover per-run + aggregate generation, the missing-CSV fallback,
and the fallback that recomputes the meta score when an input row is
missing the precomputed interface_meta_score column.
---
 src/alphajudge/report.py | 1440 ++++++++++++++++++++++++++++++++++++++
 test/test_report.py      |  122 ++++
 2 files changed, 1562 insertions(+)
 create mode 100644 src/alphajudge/report.py
 create mode 100644 test/test_report.py

diff --git a/src/alphajudge/report.py b/src/alphajudge/report.py
new file mode 100644
index 00000000..e386d215
--- /dev/null
+++ b/src/alphajudge/report.py
@@ -0,0 +1,1440 @@
+"""RCSB-style validation reports for AlphaJudge interface scores.
+
+The visual layout mirrors the wwPDB / RCSB "Full Validation Report" PDF
+(see e.g. ``https://files.rcsb.org/validation/view/<id>_full_validation.pdf``):
+
+* serif typography (DejaVu Serif, the available Computer-Modern lookalike);
+* a smooth red -> yellow -> green percentile slider with a single black
+  marker for the entry's archive percentile;
+* a numbered "Overall quality at a glance" page with a metric/value table;
+* a page header rule with title + page number + entry id, and a
+  bottom rule with a "Continued on next page" note.
+
+Two entry points:
+
+* :func:`generate_per_run_report` -- one ``report.pdf`` per run directory.
+* :func:`generate_aggregate_report` -- a multi-page PDF over a merged CSV.
+"""
+
+from __future__ import annotations
+
+import csv
+import logging
+import math
+from collections import OrderedDict
+from collections.abc import Mapping, Sequence
+from datetime import datetime
+from pathlib import Path
+from typing import Any
+
+import matplotlib
+
+matplotlib.use("Agg")
+import matplotlib.image as mpimg
+import matplotlib.pyplot as plt
+import numpy as np
+from matplotlib.backends.backend_pdf import PdfPages
+from matplotlib.patches import FancyBboxPatch, Rectangle
+
+from .meta_score import (
+    BENCHMARK_QUANTILES,
+    CALIBRATION_LEVELS,
+    FEATURE_DIRECTIONS,
+    META_SCORE_FEATURES,
+    calibrated_feature_percentile,
+    interface_meta_score,
+)
+
+logger = logging.getLogger(__name__)
+
+_A4 = (8.27, 11.69)
+_SLIDER_CMAP = "RdYlGn"
+_INFO_BG = "#fbe5e5"
+_INFO_EDGE = "#a83232"
+_HEADER_RULE = "#3a3a3a"
+_TABLE_RULE = "#404040"
+
+_REPORT_TITLE = "AlphaJudge Interface Validation Report"
+_BENCHMARK_TAG = "benchmark_26 (final_sync_20260523, n=7,756 AF2/AF3 rows)"
+
+_FEATURE_DISPLAY = {
+    "interface_LIS": "Interface LIS",
+    "interface_ipSAE": "Interface ipSAE",
+    "interface_pDockQ2": "Interface pDockQ2",
+    "iptm": "ipTM",
+    "confidence_score": "Confidence score",
+    "average_interface_pae": "Avg. interface PAE",
+    "pDockQ/mpDockQ": "pDockQ / mpDockQ",
+    "interface_sc": "Shape complementarity",
+    "interface_area": "Interface area",
+    "interface_solv_en": "Solvation energy",
+}
+
+_FEATURE_UNITS = {
+    "average_interface_pae": "Å",
+    "interface_area": "Å²",
+    "interface_solv_en": "kcal/mol",
+}
+
+
+# ---------------------------------------------------------------------------
+# style + utility helpers
+# ---------------------------------------------------------------------------
+
+def _setup_rcparams() -> None:
+    rcparams = {
+        "font.family": "serif",
+        "font.serif": ["DejaVu Serif", "Times New Roman", "Times"],
+        "mathtext.fontset": "dejavuserif",
+        "axes.titlesize": 11,
+        "axes.labelsize": 9,
+        "axes.spines.top": False,
+        "axes.spines.right": False,
+        "xtick.labelsize": 8,
+        "ytick.labelsize": 8,
+        "axes.edgecolor": "#222222",
+        "savefig.dpi": 200,
+    }
+    matplotlib.rcParams.update(rcparams)
+
+
+def _safe_float(value: Any) -> float | None:
+    try:
+        parsed = float(value)
+    except (TypeError, ValueError):
+        return None
+    return parsed if math.isfinite(parsed) else None
+
+
+def _read_csv_rows(path: Path) -> list[dict[str, str]]:
+    with path.open() as fh:
+        return list(csv.DictReader(fh))
+
+
+def _row_meta_score(row: Mapping[str, Any]) -> float | None:
+    direct = _safe_float(row.get("interface_meta_score"))
+    if direct is not None:
+        return direct
+    computed = interface_meta_score(row)
+    if isinstance(computed, float) and math.isfinite(computed):
+        return computed
+    return None
+
+
+def _feature_view(row: Mapping[str, Any]) -> "OrderedDict[str, tuple[float | None, float | None]]":
+    view: "OrderedDict[str, tuple[float | None, float | None]]" = OrderedDict()
+    for feat in META_SCORE_FEATURES:
+        raw = _safe_float(row.get(feat))
+        pct = calibrated_feature_percentile(feat, raw) if raw is not None else None
+        view[feat] = (raw, pct)
+    return view
+
+
+def _best_row(rows: Sequence[Mapping[str, Any]]) -> Mapping[str, Any] | None:
+    best: tuple[float, Mapping[str, Any]] | None = None
+    for r in rows:
+        s = _row_meta_score(r)
+        if s is None:
+            continue
+        if best is None or s > best[0]:
+            best = (s, r)
+    if best is not None:
+        return best[1]
+    return rows[0] if rows else None
+
+
+def _group_complex_rows(rows: Sequence[Mapping[str, Any]]) -> "OrderedDict[str, list[Mapping[str, Any]]]":
+    grouped: "OrderedDict[str, list[Mapping[str, Any]]]" = OrderedDict()
+    for r in rows:
+        key = str(r.get("jobs") or r.get("pair") or r.get("complex") or "")
+        if not key:
+            continue
+        grouped.setdefault(key, []).append(r)
+    return grouped
+
+
+def _format_raw(value: float | None, *, decimals: int = 3) -> str:
+    if value is None:
+        return "—"
+    av = abs(value)
+    if av != 0.0 and (av >= 10000 or av < 0.001):
+        return f"{value:.2e}"
+    if av >= 100:
+        return f"{value:.1f}"
+    return f"{value:.{decimals}g}"
+
+
+def _truncate(text: str, max_len: int) -> str:
+    if len(text) <= max_len:
+        return text
+    return text[: max_len - 1] + "…"
+
+
+def _shorten_path(path: str, max_len: int = 64) -> str:
+    if len(path) <= max_len:
+        return path
+    head = path[: max_len // 2 - 1]
+    tail = path[-(max_len // 2):]
+    return f"{head}…{tail}"
+
+
+def _detect_backend(rows: Sequence[Mapping[str, Any]]) -> str:
+    for r in rows:
+        model = str(r.get("model_used") or "")
+        if "multimer" in model.lower():
+            return "AlphaFold 2"
+        if model.startswith("seed-") or "_sample-" in model:
+            return "AlphaFold 3"
+        if "boltz" in model.lower():
+            return "Boltz-2"
+    return "unknown"
+
+
+def _detect_chain_set(rows: Sequence[Mapping[str, Any]]) -> set[str]:
+    chains: set[str] = set()
+    for r in rows:
+        iface = str(r.get("interface") or "")
+        for part in iface.split("_"):
+            if part:
+                chains.add(part)
+    return chains
+
+
+def _decile_label(pct: float | None) -> str:
+    if pct is None:
+        return "n/a"
+    if pct >= 0.9:
+        return "Top decile"
+    if pct >= 0.75:
+        return "Upper quartile"
+    if pct >= 0.5:
+        return "Above median"
+    if pct >= 0.25:
+        return "Below median"
+    if pct >= 0.1:
+        return "Lower quartile"
+    return "Bottom decile"
+
+
+# ---------------------------------------------------------------------------
+# page primitives
+# ---------------------------------------------------------------------------
+
+def _new_figure() -> plt.Figure:
+    return plt.figure(figsize=_A4, facecolor="white")
+
+
+def _add_page_header(fig: plt.Figure, *, page_no: int, total: int, title: str, entry: str) -> None:
+    ax = fig.add_axes((0.07, 0.965, 0.86, 0.018))
+    ax.axis("off")
+    ax.text(0.0, 0.5, f"Page {page_no}", fontsize=8, color="#333", va="center", transform=ax.transAxes)
+    ax.text(0.5, 0.5, title, fontsize=8, color="#333", va="center", ha="center", transform=ax.transAxes)
+    ax.text(1.0, 0.5, entry, fontsize=8, color="#333", va="center", ha="right", transform=ax.transAxes)
+    rule = fig.add_axes((0.07, 0.957, 0.86, 0.003))
+    rule.axis("off")
+    rule.axhline(0.5, color=_HEADER_RULE, linewidth=0.8)
+
+
+def _add_page_footer(fig: plt.Figure, *, page_no: int, total: int, last: bool) -> None:
+    rule = fig.add_axes((0.07, 0.038, 0.86, 0.003))
+    rule.axis("off")
+    rule.axhline(0.5, color=_HEADER_RULE, linewidth=0.6)
+    ax = fig.add_axes((0.07, 0.018, 0.86, 0.018))
+    ax.axis("off")
+    if not last and page_no < total:
+        ax.text(
+            0.5,
+            0.5,
+            "Continued on next page…",
+            ha="center",
+            va="center",
+            fontsize=8,
+            color="#666",
+            style="italic",
+            transform=ax.transAxes,
+        )
+    ax.text(
+        1.0,
+        0.5,
+        f"{page_no} / {total}",
+        ha="right",
+        va="center",
+        fontsize=8,
+        color="#555",
+        transform=ax.transAxes,
+    )
+    ax.text(
+        0.0,
+        0.5,
+        "AlphaJudge",
+        ha="left",
+        va="center",
+        fontsize=8,
+        color="#555",
+        transform=ax.transAxes,
+    )
+
+
+def _draw_info_box(fig: plt.Figure, *, x: float, y: float, w: float, h: float, lines: Sequence[str]) -> None:
+    ax = fig.add_axes((x, y, w, h))
+    ax.set_xlim(0, 1)
+    ax.set_ylim(0, 1)
+    ax.axis("off")
+    box = FancyBboxPatch(
+        (0.005, 0.05),
+        0.99,
+        0.90,
+        boxstyle="round,pad=0.02,rounding_size=0.02",
+        linewidth=0.6,
+        edgecolor=_INFO_EDGE,
+        facecolor=_INFO_BG,
+        transform=ax.transAxes,
+    )
+    ax.add_patch(box)
+    n = len(lines)
+    if n == 0:
+        return
+    top = 0.83
+    line_h = 0.7 / max(1, n)
+    for i, line in enumerate(lines):
+        ax.text(
+            0.5,
+            top - i * line_h,
+            line,
+            ha="center",
+            va="top",
+            fontsize=9.5,
+            color="#1d1d1d",
+            transform=ax.transAxes,
+        )
+
+
+def _draw_meta_block(fig: plt.Figure, *, x: float, y: float, w: float, h: float, pairs: Sequence[tuple[str, str]]) -> None:
+    """Right-aligned label, colon, then value (RCSB style)."""
+    ax = fig.add_axes((x, y, w, h))
+    ax.set_xlim(0, 1)
+    ax.set_ylim(0, 1)
+    ax.axis("off")
+    n = len(pairs)
+    if n == 0:
+        return
+    top = 0.92
+    line_h = 0.85 / max(1, n)
+    label_x = 0.36
+    sep_x = 0.40
+    val_x = 0.44
+    for i, (label, value) in enumerate(pairs):
+        ypos = top - i * line_h
+        ax.text(label_x, ypos, label, fontsize=10.5, ha="right", va="top", transform=ax.transAxes)
+        ax.text(sep_x, ypos, ":", fontsize=10.5, ha="center", va="top", transform=ax.transAxes)
+        ax.text(val_x, ypos, value, fontsize=10.5, ha="left", va="top", transform=ax.transAxes)
+
+
+def _draw_section_heading(fig: plt.Figure, *, x: float, y: float, w: float, h: float, number: str, title: str) -> None:
+    ax = fig.add_axes((x, y, w, h))
+    ax.axis("off")
+    ax.text(
+        0.0,
+        0.4,
+        f"{number}  {title}",
+        fontsize=15,
+        fontweight="bold",
+        color="#101010",
+        transform=ax.transAxes,
+    )
+
+
+# ---------------------------------------------------------------------------
+# slider primitive
+# ---------------------------------------------------------------------------
+
+_GRADIENT = np.tile(np.linspace(0.02, 0.98, 512), (4, 1))
+
+
+def _draw_slider_bar(
+    ax,
+    percentile: float | None,
+    *,
+    cmap: str = _SLIDER_CMAP,
+    show_axis: bool = False,
+) -> None:
+    """RCSB-style horizontal percentile bar with a single black marker."""
+
+    ax.imshow(
+        _GRADIENT,
+        aspect="auto",
+        cmap=cmap,
+        extent=(0.0, 1.0, 0.0, 1.0),
+        interpolation="bilinear",
+    )
+    ax.set_xlim(0.0, 1.0)
+    ax.set_ylim(0.0, 1.0)
+    ax.set_yticks([])
+    if show_axis:
+        ax.set_xticks([0.0, 0.25, 0.5, 0.75, 1.0])
+        ax.set_xticklabels(["0", "25", "50", "75", "100"], fontsize=7)
+        ax.tick_params(axis="x", length=2, pad=1, colors="#333333")
+    else:
+        ax.set_xticks([])
+
+    for spine in ax.spines.values():
+        spine.set_visible(True)
+        spine.set_edgecolor("#1a1a1a")
+        spine.set_linewidth(0.6)
+
+    if percentile is not None:
+        ax.add_patch(
+            Rectangle(
+                (max(0.0, min(1.0, percentile)) - 0.005, -0.10),
+                0.010,
+                1.20,
+                color="#0e0e0e",
+                clip_on=False,
+                zorder=5,
+            )
+        )
+
+
+_LAYOUT = {
+    "left": 0.085,
+    "label_width": 0.190,
+    "gap_label_slider": 0.012,
+    "slider_width": 0.460,
+    "gap_slider_pct": 0.014,
+    "pct_width": 0.045,
+    "gap_pct_value": 0.010,
+    "value_width": 0.115,
+}
+
+
+def _draw_slider_row(
+    fig: plt.Figure,
+    *,
+    bottom: float,
+    height: float,
+    label: str,
+    raw: float | None,
+    pct: float | None,
+    units: str = "",
+    show_axis: bool = False,
+) -> None:
+    L = _LAYOUT
+    x = L["left"]
+    label_ax = fig.add_axes((x, bottom, L["label_width"], height))
+    label_ax.axis("off")
+    label_ax.text(
+        1.0,
+        0.5,
+        label,
+        fontsize=10,
+        ha="right",
+        va="center",
+        transform=label_ax.transAxes,
+    )
+    x += L["label_width"] + L["gap_label_slider"]
+
+    slider_ax = fig.add_axes(
+        (
+            x,
+            bottom + (0.20 if not show_axis else 0.30) * height,
+            L["slider_width"],
+            (0.55 if not show_axis else 0.42) * height,
+        )
+    )
+    _draw_slider_bar(slider_ax, pct, show_axis=show_axis)
+    x += L["slider_width"] + L["gap_slider_pct"]
+
+    pct_ax = fig.add_axes((x, bottom + 0.18 * height, L["pct_width"], 0.64 * height))
+    pct_ax.set_xlim(0, 1)
+    pct_ax.set_ylim(0, 1)
+    pct_ax.axis("off")
+    pct_text = "n/a" if pct is None else f"{pct * 100:0.0f}%"
+    pct_ax.text(
+        0.5,
+        0.5,
+        pct_text,
+        ha="center",
+        va="center",
+        fontsize=9,
+        color="#222222",
+        transform=pct_ax.transAxes,
+    )
+    x += L["pct_width"] + L["gap_pct_value"]
+
+    value_ax = fig.add_axes((x, bottom + 0.18 * height, L["value_width"], 0.64 * height))
+    value_ax.set_xlim(0, 1)
+    value_ax.set_ylim(0, 1)
+    value_ax.set_xticks([])
+    value_ax.set_yticks([])
+    for spine in value_ax.spines.values():
+        spine.set_edgecolor("#5a5a5a")
+        spine.set_linewidth(0.6)
+    raw_text = _format_raw(raw)
+    if units:
+        raw_text = f"{raw_text} {units}"
+    value_ax.text(
+        0.5,
+        0.5,
+        raw_text,
+        ha="center",
+        va="center",
+        fontsize=9,
+        transform=value_ax.transAxes,
+    )
+
+
+def _draw_slider_panel(
+    fig: plt.Figure,
+    *,
+    top: float,
+    height: float,
+    row: Mapping[str, Any],
+    include_overall: bool = True,
+) -> None:
+    """RCSB-style 'Metric | Percentile rank | %ile | Value' table."""
+
+    rows: list[tuple[str, float | None, float | None, str]] = []
+    if include_overall:
+        score = _row_meta_score(row)
+        rows.append(("Overall meta score", score, score, ""))
+    fv = _feature_view(row)
+    for feat in META_SCORE_FEATURES:
+        raw, pct = fv[feat]
+        rows.append((_FEATURE_DISPLAY.get(feat, feat), raw, pct, _FEATURE_UNITS.get(feat, "")))
+
+    L = _LAYOUT
+    header_y = top
+    body_top = top - 0.024
+    n_rows = len(rows)
+    body_height = height - 0.024
+    row_h = body_height / n_rows
+
+    # Header band
+    band = fig.add_axes(
+        (
+            L["left"],
+            header_y - 0.022,
+            L["label_width"] + L["gap_label_slider"] + L["slider_width"] + L["gap_slider_pct"]
+            + L["pct_width"] + L["gap_pct_value"] + L["value_width"],
+            0.022,
+        )
+    )
+    band.set_xlim(0, 1)
+    band.set_ylim(0, 1)
+    band.axis("off")
+    band.add_patch(Rectangle((0.0, 0.0), 1.0, 1.0, color="#efe9d8", transform=band.transAxes))
+
+    band_w = (
+        L["label_width"] + L["gap_label_slider"] + L["slider_width"]
+        + L["gap_slider_pct"] + L["pct_width"] + L["gap_pct_value"] + L["value_width"]
+    )
+
+    def _hx(col_start: float, col_w: float) -> float:
+        return (col_start - L["left"] + col_w / 2) / band_w
+
+    # Place header labels at column centers
+    band.text(
+        _hx(L["left"], L["label_width"]),
+        0.5,
+        "Metric",
+        fontsize=10,
+        fontweight="bold",
+        ha="center",
+        va="center",
+        transform=band.transAxes,
+    )
+    slider_start = L["left"] + L["label_width"] + L["gap_label_slider"]
+    band.text(
+        _hx(slider_start, L["slider_width"]),
+        0.5,
+        "Percentile rank",
+        fontsize=10,
+        fontweight="bold",
+        ha="center",
+        va="center",
+        transform=band.transAxes,
+    )
+    pct_start = slider_start + L["slider_width"] + L["gap_slider_pct"]
+    band.text(
+        _hx(pct_start, L["pct_width"]),
+        0.5,
+        "%",
+        fontsize=10,
+        fontweight="bold",
+        ha="center",
+        va="center",
+        transform=band.transAxes,
+    )
+    value_start = pct_start + L["pct_width"] + L["gap_pct_value"]
+    band.text(
+        _hx(value_start, L["value_width"]),
+        0.5,
+        "Value",
+        fontsize=10,
+        fontweight="bold",
+        ha="center",
+        va="center",
+        transform=band.transAxes,
+    )
+
+    for i, (label, raw, pct, units) in enumerate(rows):
+        row_bottom = body_top - (i + 1) * row_h
+        show_axis = i == n_rows - 1
+        _draw_slider_row(
+            fig,
+            bottom=row_bottom,
+            height=row_h * 0.92,
+            label=label,
+            raw=raw,
+            pct=pct,
+            units=units,
+            show_axis=show_axis,
+        )
+
+    bottom_y = body_top - n_rows * row_h
+    legend_ax = fig.add_axes((slider_start, bottom_y - 0.022, L["slider_width"], 0.018))
+    legend_ax.axis("off")
+    legend_ax.annotate(
+        "Worse",
+        xy=(0.0, 0.5),
+        xytext=(0.08, 0.5),
+        xycoords="axes fraction",
+        textcoords="axes fraction",
+        fontsize=8.5,
+        color="#7a1d1d",
+        va="center",
+        ha="left",
+        arrowprops=dict(arrowstyle="<-", color="#7a1d1d", lw=0.7),
+    )
+    legend_ax.annotate(
+        "Better",
+        xy=(1.0, 0.5),
+        xytext=(0.92, 0.5),
+        xycoords="axes fraction",
+        textcoords="axes fraction",
+        fontsize=8.5,
+        color="#1d5d1d",
+        va="center",
+        ha="right",
+        arrowprops=dict(arrowstyle="->", color="#1d5d1d", lw=0.7),
+    )
+
+
+# ---------------------------------------------------------------------------
+# compact, fixed-width tables (no matplotlib.table -- it truncates labels)
+# ---------------------------------------------------------------------------
+
+def _draw_fixed_table(
+    fig: plt.Figure,
+    *,
+    x: float,
+    y_top: float,
+    w: float,
+    headers: Sequence[str],
+    rows: Sequence[Sequence[str]],
+    col_fracs: Sequence[float],
+    row_height: float = 0.024,
+    header_color: str = "#efe9d8",
+    font_size: float = 8.5,
+) -> float:
+    """Draw a table anchored at top ``y_top``, growing downward.
+
+    Returns the bottom y of the table (figure fraction).
+    """
+
+    assert abs(sum(col_fracs) - 1.0) < 1e-6, "col_fracs must sum to 1"
+
+    n_rows = len(rows)
+    table_h = row_height * (n_rows + 1)
+    ax = fig.add_axes((x, y_top - table_h, w, table_h))
+    ax.set_xlim(0, 1)
+    ax.set_ylim(0, 1)
+    ax.axis("off")
+    if not rows:
+        ax.text(0.5, 0.5, "no data", ha="center", va="center", fontsize=10, color="#555")
+        return y_top - table_h
+
+    # Header row at the top of the axes
+    cell_h = 1.0 / (n_rows + 1)
+    header_top = 1.0
+    ax.add_patch(Rectangle((0.0, header_top - cell_h), 1.0, cell_h, color=header_color, zorder=1))
+    x_left = 0.0
+    for frac, label in zip(col_fracs, headers):
+        ax.add_patch(
+            Rectangle(
+                (x_left, header_top - cell_h),
+                frac,
+                cell_h,
+                fill=False,
+                edgecolor=_TABLE_RULE,
+                linewidth=0.5,
+                zorder=2,
+            )
+        )
+        ax.text(
+            x_left + frac / 2,
+            header_top - cell_h / 2,
+            label,
+            ha="center",
+            va="center",
+            fontsize=font_size + 0.5,
+            fontweight="bold",
+            color="#111111",
+            transform=ax.transAxes,
+        )
+        x_left += frac
+
+    # Approx max characters per column based on width and font size
+    inch_w = w * _A4[0]
+    max_chars_per_col = [max(4, int(frac * inch_w * 12)) for frac in col_fracs]
+
+    cur_y = header_top - cell_h
+    for r_idx, row_vals in enumerate(rows):
+        cell_bot = cur_y - cell_h
+        bg = "#ffffff" if r_idx % 2 == 0 else "#f6f6f0"
+        ax.add_patch(Rectangle((0.0, cell_bot), 1.0, cell_h, color=bg, zorder=1))
+        x_left = 0.0
+        for frac, cell, max_chars in zip(col_fracs, row_vals, max_chars_per_col):
+            ax.add_patch(
+                Rectangle(
+                    (x_left, cell_bot),
+                    frac,
+                    cell_h,
+                    fill=False,
+                    edgecolor=_TABLE_RULE,
+                    linewidth=0.4,
+                    zorder=2,
+                )
+            )
+            ax.text(
+                x_left + frac / 2,
+                cell_bot + cell_h / 2,
+                _truncate(str(cell), max_chars),
+                ha="center",
+                va="center",
+                fontsize=font_size,
+                color="#1a1a1a",
+                transform=ax.transAxes,
+            )
+            x_left += frac
+        cur_y = cell_bot
+
+    return y_top - table_h
+
+
+# ---------------------------------------------------------------------------
+# pages
+# ---------------------------------------------------------------------------
+
+def _cover_page(
+    pdf: PdfPages,
+    *,
+    title: str,
+    subtitle_lines: Sequence[str],
+    entry_id: str,
+    meta_pairs: Sequence[tuple[str, str]],
+    info_lines: Sequence[str],
+    software_lines: Sequence[tuple[str, str]],
+    page_no: int,
+    total: int,
+) -> None:
+    fig = _new_figure()
+    _add_page_header(fig, page_no=page_no, total=total, title=title, entry=entry_id)
+
+    title_ax = fig.add_axes((0.07, 0.85, 0.86, 0.06))
+    title_ax.axis("off")
+    title_ax.text(
+        0.5,
+        0.5,
+        title,
+        ha="center",
+        va="center",
+        fontsize=22,
+        fontweight="bold",
+        color="#101010",
+        transform=title_ax.transAxes,
+    )
+
+    sub_ax = fig.add_axes((0.07, 0.815, 0.86, 0.025))
+    sub_ax.axis("off")
+    sub_ax.text(
+        0.5,
+        0.5,
+        " – ".join(subtitle_lines),
+        ha="center",
+        va="center",
+        fontsize=11,
+        color="#1f1f1f",
+        transform=sub_ax.transAxes,
+    )
+
+    _draw_meta_block(fig, x=0.10, y=0.62, w=0.80, h=0.18, pairs=meta_pairs)
+    _draw_info_box(fig, x=0.13, y=0.43, w=0.74, h=0.16, lines=info_lines)
+
+    sw_ax = fig.add_axes((0.10, 0.20, 0.80, 0.18))
+    sw_ax.set_xlim(0, 1)
+    sw_ax.set_ylim(0, 1)
+    sw_ax.axis("off")
+    sw_ax.text(
+        0.0,
+        0.95,
+        "The following software and reference data were used in this report:",
+        fontsize=10,
+        ha="left",
+        va="top",
+        transform=sw_ax.transAxes,
+    )
+    n = len(software_lines)
+    if n:
+        top = 0.80
+        line_h = 0.68 / max(1, n)
+        for i, (k, v) in enumerate(software_lines):
+            ypos = top - i * line_h
+            sw_ax.text(0.40, ypos, k, fontsize=10, ha="right", va="top", transform=sw_ax.transAxes)
+            sw_ax.text(0.42, ypos, ":", fontsize=10, ha="center", va="top", transform=sw_ax.transAxes)
+            sw_ax.text(0.44, ypos, v, fontsize=10, ha="left", va="top", transform=sw_ax.transAxes)
+
+    _add_page_footer(fig, page_no=page_no, total=total, last=False)
+    pdf.savefig(fig)
+    plt.close(fig)
+
+
+def _quality_page(
+    pdf: PdfPages,
+    *,
+    title: str,
+    entry_id: str,
+    section_no: str,
+    section_title: str,
+    pre_lines: Sequence[str],
+    row: Mapping[str, Any],
+    page_no: int,
+    total: int,
+    last: bool = False,
+) -> None:
+    fig = _new_figure()
+    _add_page_header(fig, page_no=page_no, total=total, title=title, entry=entry_id)
+    _draw_section_heading(fig, x=0.07, y=0.91, w=0.86, h=0.03, number=section_no, title=section_title)
+    intro_ax = fig.add_axes((0.10, 0.79, 0.80, 0.11))
+    intro_ax.axis("off")
+    for i, line in enumerate(pre_lines):
+        intro_ax.text(
+            0.0,
+            0.95 - i * 0.18,
+            line,
+            fontsize=10,
+            ha="left",
+            va="top",
+            transform=intro_ax.transAxes,
+        )
+
+    _draw_slider_panel(fig, top=0.76, height=0.60, row=row, include_overall=True)
+
+    explanation_ax = fig.add_axes((0.10, 0.06, 0.80, 0.06))
+    explanation_ax.axis("off")
+    explanation_ax.text(
+        0.5,
+        0.9,
+        "Percentile ranks are computed against the AlphaJudge benchmark distribution; "
+        "higher is better for every metric (sign-flipped where needed).",
+        ha="center",
+        va="top",
+        fontsize=9,
+        color="#555",
+        transform=explanation_ax.transAxes,
+    )
+
+    _add_page_footer(fig, page_no=page_no, total=total, last=last)
+    pdf.savefig(fig)
+    plt.close(fig)
+
+
+def _per_interface_page(
+    pdf: PdfPages,
+    *,
+    title: str,
+    entry_id: str,
+    section_no: str,
+    rows: Sequence[Mapping[str, Any]],
+    page_no: int,
+    total: int,
+    last: bool = False,
+) -> None:
+    fig = _new_figure()
+    _add_page_header(fig, page_no=page_no, total=total, title=title, entry=entry_id)
+    _draw_section_heading(
+        fig, x=0.07, y=0.91, w=0.86, h=0.03,
+        number=section_no, title="Per-interface raw scores",
+    )
+
+    intro_ax = fig.add_axes((0.10, 0.84, 0.80, 0.05))
+    intro_ax.axis("off")
+    intro_ax.text(
+        0.0,
+        1.0,
+        "Each row is one chain pair detected by AlphaJudge. The Meta column is the "
+        "averaged percentile across the 10 metascore features (higher is better).",
+        fontsize=9,
+        ha="left",
+        va="top",
+        transform=intro_ax.transAxes,
+    )
+
+    headers = ["Model", "Interface", "Residues", "Meta", "LIS", "ipSAE", "pDockQ2", "ipTM", "PAE", "Sc"]
+    body: list[list[str]] = []
+    for r in rows:
+        body.append(
+            [
+                _truncate(str(r.get("model_used") or ""), 26),
+                str(r.get("interface") or ""),
+                str(r.get("interface_num_intf_residues") or ""),
+                _format_raw(_row_meta_score(r)),
+                _format_raw(_safe_float(r.get("interface_LIS"))),
+                _format_raw(_safe_float(r.get("interface_ipSAE"))),
+                _format_raw(_safe_float(r.get("interface_pDockQ2"))),
+                _format_raw(_safe_float(r.get("iptm"))),
+                _format_raw(_safe_float(r.get("average_interface_pae"))),
+                _format_raw(_safe_float(r.get("interface_sc"))),
+            ]
+        )
+
+    col_fracs = [0.21, 0.09, 0.08, 0.08, 0.08, 0.09, 0.10, 0.07, 0.08, 0.12]
+    _draw_fixed_table(
+        fig,
+        x=0.07,
+        y_top=0.80,
+        w=0.86,
+        headers=headers,
+        rows=body,
+        col_fracs=col_fracs,
+        row_height=0.026,
+    )
+
+    _add_page_footer(fig, page_no=page_no, total=total, last=last)
+    pdf.savefig(fig)
+    plt.close(fig)
+
+
+def _pae_page(
+    pdf: PdfPages,
+    *,
+    title: str,
+    entry_id: str,
+    section_no: str,
+    image_path: Path,
+    model_label: str,
+    page_no: int,
+    total: int,
+    last: bool = False,
+) -> None:
+    fig = _new_figure()
+    _add_page_header(fig, page_no=page_no, total=total, title=title, entry=entry_id)
+    _draw_section_heading(
+        fig, x=0.07, y=0.91, w=0.86, h=0.03,
+        number=section_no, title=f"Predicted Aligned Error – {model_label}",
+    )
+    img_ax = fig.add_axes((0.13, 0.10, 0.74, 0.78))
+    try:
+        img = mpimg.imread(str(image_path))
+        img_ax.imshow(img)
+    except Exception as e:
+        img_ax.text(0.5, 0.5, f"PAE image unavailable\n({e})", ha="center", va="center")
+    img_ax.set_xticks([])
+    img_ax.set_yticks([])
+    for spine in img_ax.spines.values():
+        spine.set_visible(False)
+    _add_page_footer(fig, page_no=page_no, total=total, last=last)
+    pdf.savefig(fig)
+    plt.close(fig)
+
+
+# ---------------------------------------------------------------------------
+# aggregate
+# ---------------------------------------------------------------------------
+
+def _aggregate_cover_page(
+    pdf: PdfPages,
+    *,
+    summary_csv: Path,
+    n_complexes: int,
+    n_rows: int,
+    scores: Sequence[float],
+    top_rows: Sequence[tuple[str, float, Mapping[str, Any]]],
+    backends: Mapping[str, int],
+    page_no: int,
+    total: int,
+) -> None:
+    fig = _new_figure()
+    _add_page_header(
+        fig, page_no=page_no, total=total,
+        title=_REPORT_TITLE, entry="Aggregate report",
+    )
+
+    title_ax = fig.add_axes((0.07, 0.87, 0.86, 0.06))
+    title_ax.axis("off")
+    title_ax.text(
+        0.5,
+        0.5,
+        _REPORT_TITLE,
+        fontsize=22,
+        fontweight="bold",
+        ha="center",
+        va="center",
+        transform=title_ax.transAxes,
+    )
+    sub_ax = fig.add_axes((0.07, 0.835, 0.86, 0.025))
+    sub_ax.axis("off")
+    sub_ax.text(
+        0.5,
+        0.5,
+        f"Aggregate report – {n_complexes} complexes",
+        ha="center",
+        va="center",
+        fontsize=11,
+        color="#1f1f1f",
+        transform=sub_ax.transAxes,
+    )
+
+    meta = [
+        ("Source", _shorten_path(str(summary_csv), max_len=58)),
+        ("Date", datetime.now().strftime("%Y-%m-%d %H:%M")),
+        ("Complexes", str(n_complexes)),
+        ("Interface rows", str(n_rows)),
+    ]
+    if backends:
+        meta.append(("Backends", ", ".join(f"{k}={v}" for k, v in backends.items())))
+    _draw_meta_block(fig, x=0.10, y=0.68, w=0.80, h=0.13, pairs=meta)
+
+    info = [
+        "This report scores AlphaFold-predicted complexes against the",
+        "AlphaJudge benchmark_26 reference set.",
+        "All percentiles are archive percentiles; higher is better.",
+    ]
+    _draw_info_box(fig, x=0.13, y=0.54, w=0.74, h=0.11, lines=info)
+
+    hist_ax = fig.add_axes((0.10, 0.36, 0.50, 0.14))
+    if scores:
+        hist_ax.hist(scores, bins=24, range=(0.0, 1.0), color="#5688c7", edgecolor="white")
+    hist_ax.set_xlim(0.0, 1.0)
+    hist_ax.set_xlabel("Interface meta score (best per complex)", fontsize=9, labelpad=2)
+    hist_ax.set_ylabel("Complexes", fontsize=9)
+    hist_ax.set_title("Distribution across cohort", fontsize=10, loc="left")
+    hist_ax.tick_params(labelsize=8)
+
+    stats_ax = fig.add_axes((0.64, 0.36, 0.26, 0.14))
+    stats_ax.axis("off")
+    if scores:
+        median = sorted(scores)[len(scores) // 2]
+        mean = sum(scores) / len(scores)
+        stats_ax.text(0.0, 0.95, "Cohort statistics", fontsize=11, fontweight="bold", transform=stats_ax.transAxes)
+        lines = [
+            f"min      = {min(scores):.3f}",
+            f"median   = {median:.3f}",
+            f"mean     = {mean:.3f}",
+            f"max      = {max(scores):.3f}",
+            f"≥ 0.5  = {sum(1 for s in scores if s >= 0.5)} ({100*sum(1 for s in scores if s >= 0.5)/len(scores):.0f}%)",
+            f"≥ 0.7  = {sum(1 for s in scores if s >= 0.7)} ({100*sum(1 for s in scores if s >= 0.7)/len(scores):.0f}%)",
+        ]
+        for i, line in enumerate(lines):
+            stats_ax.text(0.0, 0.78 - i * 0.12, line, fontsize=10, family="monospace", transform=stats_ax.transAxes)
+
+    title2_ax = fig.add_axes((0.07, 0.305, 0.86, 0.020))
+    title2_ax.axis("off")
+    title2_ax.text(
+        0.5,
+        0.5,
+        f"Top {len(top_rows)} complexes by interface meta score",
+        ha="center",
+        va="center",
+        fontsize=11,
+        fontweight="bold",
+        transform=title2_ax.transAxes,
+    )
+    headers = ["Rank", "Complex", "Meta", "LIS", "ipSAE", "ipTM", "PAE", "Sc"]
+    body: list[list[str]] = []
+    for i, (name, score, row) in enumerate(top_rows, start=1):
+        body.append(
+            [
+                str(i),
+                _truncate(name, 28),
+                _format_raw(score),
+                _format_raw(_safe_float(row.get("interface_LIS"))),
+                _format_raw(_safe_float(row.get("interface_ipSAE"))),
+                _format_raw(_safe_float(row.get("iptm"))),
+                _format_raw(_safe_float(row.get("average_interface_pae"))),
+                _format_raw(_safe_float(row.get("interface_sc"))),
+            ]
+        )
+    col_fracs = [0.07, 0.30, 0.10, 0.10, 0.10, 0.10, 0.10, 0.13]
+    _draw_fixed_table(
+        fig,
+        x=0.07,
+        y_top=0.285,
+        w=0.86,
+        headers=headers,
+        rows=body,
+        col_fracs=col_fracs,
+        row_height=0.020,
+    )
+
+    _add_page_footer(fig, page_no=page_no, total=total, last=False)
+    pdf.savefig(fig)
+    plt.close(fig)
+
+
+def _complex_summary_page(
+    pdf: PdfPages,
+    *,
+    complex_name: str,
+    rows: Sequence[Mapping[str, Any]],
+    cohort_position: tuple[int, int] | None,
+    page_no: int,
+    total: int,
+    last: bool,
+) -> None:
+    best = _best_row(rows) or rows[0]
+    fig = _new_figure()
+    _add_page_header(
+        fig, page_no=page_no, total=total,
+        title=_REPORT_TITLE, entry=_truncate(complex_name, 40),
+    )
+
+    title_ax = fig.add_axes((0.07, 0.91, 0.86, 0.05))
+    title_ax.axis("off")
+    title_ax.text(
+        0.5,
+        0.5,
+        complex_name,
+        ha="center",
+        va="center",
+        fontsize=17,
+        fontweight="bold",
+        transform=title_ax.transAxes,
+    )
+
+    sub_ax = fig.add_axes((0.07, 0.875, 0.86, 0.025))
+    sub_ax.axis("off")
+    bits = [
+        f"Model {best.get('model_used', '?')}",
+        f"Interface {best.get('interface', '?')}",
+    ]
+    if cohort_position is not None:
+        bits.append(f"Rank {cohort_position[0]} of {cohort_position[1]}")
+    n_res = best.get("interface_num_intf_residues")
+    if n_res:
+        bits.append(f"{n_res} interface residues")
+    sub_ax.text(0.5, 0.5, "  •  ".join(bits), ha="center", va="center", fontsize=10, color="#222", transform=sub_ax.transAxes)
+
+    _draw_section_heading(
+        fig, x=0.07, y=0.83, w=0.86, h=0.025,
+        number="1", title="Overall quality at a glance",
+    )
+
+    _draw_slider_panel(fig, top=0.79, height=0.62, row=best, include_overall=True)
+
+    note_ax = fig.add_axes((0.10, 0.07, 0.80, 0.06))
+    note_ax.axis("off")
+    note_ax.text(
+        0.5,
+        1.0,
+        "Black marker shows this complex's percentile rank against the AlphaJudge benchmark "
+        "(higher = better).",
+        ha="center",
+        va="top",
+        fontsize=9,
+        color="#555",
+        transform=note_ax.transAxes,
+    )
+
+    _add_page_footer(fig, page_no=page_no, total=total, last=last)
+    pdf.savefig(fig)
+    plt.close(fig)
+
+
+# ---------------------------------------------------------------------------
+# public API
+# ---------------------------------------------------------------------------
+
+def _find_pae_png(run_dir: Path, model_used: str) -> Path | None:
+    if not run_dir.is_dir():
+        return None
+    candidates = [
+        run_dir / f"pae_{model_used}.png",
+        *run_dir.glob(f"*{model_used}*PAE*plot*.png"),
+        *run_dir.glob(f"*{model_used}*.png"),
+        *run_dir.glob("*PAE*plot*ranked_0*.png"),
+    ]
+    seen: set[Path] = set()
+    for cand in candidates:
+        if cand in seen:
+            continue
+        seen.add(cand)
+        if cand.exists() and cand.is_file():
+            return cand
+    return None
+
+
+def generate_per_run_report(
+    run_dir: str | Path,
+    *,
+    csv_name: str = "interfaces.csv",
+    out_pdf: str | Path | None = None,
+) -> Path | None:
+    """Build a per-run report.pdf next to ``interfaces.csv``."""
+
+    _setup_rcparams()
+
+    run_dir = Path(run_dir)
+    interfaces_csv = run_dir / csv_name
+    if not interfaces_csv.exists():
+        logger.warning("no %s in %s; skipping report", csv_name, run_dir)
+        return None
+    rows = _read_csv_rows(interfaces_csv)
+    if not rows:
+        logger.warning("empty %s in %s; skipping report", csv_name, run_dir)
+        return None
+
+    out_pdf = Path(out_pdf) if out_pdf is not None else run_dir / "report.pdf"
+    best = _best_row(rows)
+    if best is None:
+        logger.warning("no usable rows in %s; skipping report", interfaces_csv)
+        return None
+
+    by_model: "OrderedDict[str, list[Mapping[str, Any]]]" = OrderedDict()
+    for r in rows:
+        by_model.setdefault(str(r.get("model_used") or ""), []).append(r)
+    best_model = str(best.get("model_used") or "")
+    other_models = [m for m in by_model if m and m != best_model]
+
+    pae_png = _find_pae_png(run_dir, best_model)
+
+    total = 2 + (1 if pae_png else 0) + len(other_models)
+
+    entry_id = _truncate(run_dir.name, 36)
+    chains = _detect_chain_set(rows)
+    backend = _detect_backend(rows)
+    score = _row_meta_score(best)
+    score_label = "n/a" if score is None else f"{score:.3f} ({_decile_label(score)})"
+
+    meta_pairs: list[tuple[str, str]] = [
+        ("Complex", run_dir.name),
+        ("Date", datetime.now().strftime("%Y-%m-%d %H:%M")),
+        ("Backend", backend),
+        ("Chains", ", ".join(sorted(chains)) or "?"),
+        ("Interface rows", str(len(rows))),
+        ("Best model", best_model or "?"),
+        ("Best meta score", score_label),
+    ]
+    info_lines = [
+        "AlphaJudge interface validation report.",
+        "Each metric is converted to its archive percentile using the frozen benchmark",
+        "deciles; the overall meta score is the unweighted mean over available features.",
+    ]
+    software_lines: list[tuple[str, str]] = [
+        ("Reference distribution", _BENCHMARK_TAG),
+        ("Source CSV", _shorten_path(str(interfaces_csv), max_len=62)),
+        ("Models analysed", _truncate(", ".join(by_model.keys()) or "?", 60)),
+    ]
+
+    out_pdf.parent.mkdir(parents=True, exist_ok=True)
+    with PdfPages(str(out_pdf)) as pdf:
+        page_no = 1
+        _cover_page(
+            pdf,
+            title=_REPORT_TITLE,
+            subtitle_lines=[run_dir.name, backend],
+            entry_id=entry_id,
+            meta_pairs=meta_pairs,
+            info_lines=info_lines,
+            software_lines=software_lines,
+            page_no=page_no,
+            total=total,
+        )
+
+        page_no += 1
+        _quality_page(
+            pdf,
+            title=_REPORT_TITLE,
+            entry_id=entry_id,
+            section_no="1",
+            section_title="Overall quality at a glance",
+            pre_lines=[
+                f"Best model: {best_model}",
+                f"Best interface: {best.get('interface', '?')}    Residues at interface: {best.get('interface_num_intf_residues', '?')}",
+            ],
+            row=best,
+            page_no=page_no,
+            total=total,
+            last=(page_no == total),
+        )
+
+        if pae_png is not None:
+            page_no += 1
+            _pae_page(
+                pdf,
+                title=_REPORT_TITLE,
+                entry_id=entry_id,
+                section_no="2",
+                image_path=pae_png,
+                model_label=best_model,
+                page_no=page_no,
+                total=total,
+                last=(page_no == total),
+            )
+
+        next_section = 3 if pae_png is not None else 2
+        for m in other_models:
+            m_rows = by_model[m]
+            m_best = _best_row(m_rows) or m_rows[0]
+            page_no += 1
+            _quality_page(
+                pdf,
+                title=_REPORT_TITLE,
+                entry_id=entry_id,
+                section_no=f"A.{m}",
+                section_title=f"Appendix – model {m}",
+                pre_lines=[
+                    f"Interface: {m_best.get('interface', '?')}",
+                    f"Residues at interface: {m_best.get('interface_num_intf_residues', '?')}",
+                ],
+                row=m_best,
+                page_no=page_no,
+                total=total,
+                last=(page_no == total),
+            )
+
+    logger.info("wrote %s", out_pdf)
+    return out_pdf
+
+
+def generate_aggregate_report(
+    summary_csv: str | Path,
+    *,
+    out_pdf: str | Path,
+    top_n: int = 10,
+    max_complexes: int | None = None,
+) -> Path | None:
+    """Build a multi-page aggregate validation PDF from a merged interfaces CSV."""
+
+    _setup_rcparams()
+
+    summary_csv = Path(summary_csv)
+    if not summary_csv.exists():
+        logger.warning("summary CSV not found: %s", summary_csv)
+        return None
+    rows = _read_csv_rows(summary_csv)
+    if not rows:
+        logger.warning("empty summary CSV: %s", summary_csv)
+        return None
+
+    grouped = _group_complex_rows(rows)
+    if not grouped:
+        logger.warning("no grouping key (jobs/pair) in %s", summary_csv)
+        return None
+
+    ranked: list[tuple[str, float, Mapping[str, Any]]] = []
+    for name, complex_rows in grouped.items():
+        best = _best_row(complex_rows)
+        if best is None:
+            continue
+        score = _row_meta_score(best)
+        if score is None:
+            continue
+        ranked.append((name, score, best))
+    ranked.sort(key=lambda t: t[1], reverse=True)
+
+    top_rows = ranked[:top_n]
+    if max_complexes is not None:
+        ranked_per_page = ranked[:max_complexes]
+    else:
+        ranked_per_page = ranked
+
+    backends: dict[str, int] = {}
+    for name, complex_rows in grouped.items():
+        b = _detect_backend(complex_rows)
+        backends[b] = backends.get(b, 0) + 1
+
+    scores = [s for (_, s, _) in ranked]
+    total = 1 + len(ranked_per_page)
+
+    out_pdf = Path(out_pdf)
+    out_pdf.parent.mkdir(parents=True, exist_ok=True)
+    with PdfPages(str(out_pdf)) as pdf:
+        _aggregate_cover_page(
+            pdf,
+            summary_csv=summary_csv,
+            n_complexes=len(grouped),
+            n_rows=len(rows),
+            scores=scores,
+            top_rows=top_rows,
+            backends=backends,
+            page_no=1,
+            total=total,
+        )
+        for rank, (name, _score, _best) in enumerate(ranked_per_page, start=1):
+            complex_rows = grouped[name]
+            _complex_summary_page(
+                pdf,
+                complex_name=name,
+                rows=complex_rows,
+                cohort_position=(rank, len(ranked_per_page)),
+                page_no=1 + rank,
+                total=total,
+                last=(rank == len(ranked_per_page)),
+            )
+
+    logger.info("wrote %s", out_pdf)
+    return out_pdf
+
+
+def main_aggregate(argv: list[str] | None = None) -> None:
+    """Console entry point for ``alphajudge-report``."""
+    import argparse
+
+    parser = argparse.ArgumentParser(
+        "alphajudge-report",
+        description="Generate an RCSB-style validation PDF from an AlphaJudge interfaces CSV.",
+    )
+    parser.add_argument(
+        "input",
+        help="Either a run directory (with interfaces.csv) or a merged summary CSV.",
+    )
+    parser.add_argument("--out-pdf", required=True, help="Output PDF path.")
+    parser.add_argument(
+        "--csv-name",
+        default="interfaces.csv",
+        help="CSV filename inside a run directory (default: interfaces.csv).",
+    )
+    parser.add_argument(
+        "--top-n",
+        type=int,
+        default=10,
+        help="Top-N rows shown on the aggregate cover (aggregate mode only).",
+    )
+    parser.add_argument(
+        "--max-complexes",
+        type=int,
+        default=None,
+        help="Optional cap on per-complex pages in aggregate mode.",
+    )
+    args = parser.parse_args(argv)
+
+    logging.basicConfig(level=logging.INFO, format="%(levelname)s:%(message)s")
+    src = Path(args.input)
+    if src.is_dir():
+        result = generate_per_run_report(
+            src, csv_name=args.csv_name, out_pdf=args.out_pdf
+        )
+    else:
+        result = generate_aggregate_report(
+            src,
+            out_pdf=args.out_pdf,
+            top_n=args.top_n,
+            max_complexes=args.max_complexes,
+        )
+    if result is None:
+        raise SystemExit(2)
+
+
+if __name__ == "__main__":
+    main_aggregate()
diff --git a/test/test_report.py b/test/test_report.py
new file mode 100644
index 00000000..d4defb62
--- /dev/null
+++ b/test/test_report.py
@@ -0,0 +1,122 @@
+from __future__ import annotations
+
+import csv
+from pathlib import Path
+
+import pytest
+
+from alphajudge.report import (
+    generate_aggregate_report,
+    generate_per_run_report,
+)
+
+
+_BASE_ROW = {
+    "jobs": "PROT_A_PROT_B",
+    "model_used": "model_1_multimer_v3_pred_0",
+    "interface": "A_B",
+    "iptm_ptm": "0.55",
+    "iptm": "0.55",
+    "ptm": "0.60",
+    "confidence_score": "0.62",
+    "pDockQ/mpDockQ": "0.40",
+    "average_interface_pae": "10.0",
+    "interface_average_plddt": "78.5",
+    "interface_num_intf_residues": "42",
+    "interface_polar": "11",
+    "interface_hydrophobic": "14",
+    "interface_charged": "9",
+    "interface_contact_pairs": "82",
+    "interface_score": "0.41",
+    "interface_pDockQ2": "0.06",
+    "interface_ipSAE": "0.45",
+    "interface_LIS": "0.30",
+    "interface_hb": "5",
+    "interface_sb": "2",
+    "interface_ss": "0",
+    "interface_sc": "0.50",
+    "interface_zernike_sc": "0.40",
+    "interface_area": "2300.0",
+    "interface_solv_en": "-32.0",
+    "interface_meta_score": "0.55",
+}
+
+
+def _write_csv(path: Path, rows: list[dict[str, str]]) -> None:
+    path.parent.mkdir(parents=True, exist_ok=True)
+    with path.open("w", newline="") as fh:
+        writer = csv.DictWriter(fh, fieldnames=list(rows[0].keys()))
+        writer.writeheader()
+        writer.writerows(rows)
+
+
+def _pdf_page_count(path: Path) -> int:
+    """Count '/Type /Page' (not '/Pages') occurrences in a small PDF."""
+    data = path.read_bytes()
+    count = 0
+    idx = 0
+    while True:
+        i = data.find(b"/Type /Page", idx)
+        if i < 0:
+            break
+        # Skip if this is actually '/Type /Pages'
+        if data[i + len(b"/Type /Page") : i + len(b"/Type /Page") + 1] == b"s":
+            idx = i + 1
+            continue
+        count += 1
+        idx = i + 1
+    return count
+
+
+def test_per_run_report_produces_a_pdf(tmp_path: Path) -> None:
+    rows = [
+        dict(_BASE_ROW),
+        {**_BASE_ROW, "model_used": "model_2_multimer_v3_pred_0",
+         "interface_meta_score": "0.40", "interface_LIS": "0.20"},
+    ]
+    _write_csv(tmp_path / "interfaces.csv", rows)
+    out = generate_per_run_report(tmp_path)
+    assert out is not None
+    assert out.exists()
+    assert out.stat().st_size > 0
+    assert _pdf_page_count(out) >= 2  # cover + per-interface table at minimum
+
+
+def test_per_run_report_returns_none_on_missing_csv(tmp_path: Path) -> None:
+    assert generate_per_run_report(tmp_path) is None
+
+
+def test_aggregate_report_writes_cover_plus_one_page_per_complex(tmp_path: Path) -> None:
+    rows = [
+        dict(_BASE_ROW),
+        {**_BASE_ROW, "jobs": "PROT_C_PROT_D",
+         "interface_meta_score": "0.80", "interface_LIS": "0.65"},
+        {**_BASE_ROW, "jobs": "PROT_C_PROT_D", "interface": "A_C",
+         "interface_meta_score": "0.40"},
+    ]
+    summary = tmp_path / "summary.csv"
+    _write_csv(summary, rows)
+    out = tmp_path / "aggregate.pdf"
+    result = generate_aggregate_report(summary, out_pdf=out)
+    assert result == out
+    assert out.exists() and out.stat().st_size > 0
+    # cover + 2 complex pages
+    assert _pdf_page_count(out) == 3
+
+
+def test_aggregate_report_handles_missing_meta_score_via_recompute(tmp_path: Path) -> None:
+    rows = []
+    base = dict(_BASE_ROW)
+    base.pop("interface_meta_score")
+    rows.append(base)
+    base2 = dict(_BASE_ROW)
+    base2["jobs"] = "PROT_E_PROT_F"
+    base2.pop("interface_meta_score")
+    rows.append(base2)
+    summary = tmp_path / "summary.csv"
+    _write_csv(summary, rows)
+    out = tmp_path / "agg.pdf"
+    result = generate_aggregate_report(summary, out_pdf=out)
+    assert result is not None
+    assert out.exists()
+    assert _pdf_page_count(out) == 3  # cover + 2 complexes

From e699ed12ad9fb0f33a00caa1b15faf25976624bf Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Wed, 27 May 2026 13:58:46 +0200
Subject: [PATCH 03/15] Wire validation report into AlphaJudge CLI and runner

Surfaces the report module so reports can be generated as part of a
scoring run without an explicit second step.

CLI (alphajudge):
  - Mutually-exclusive --report / --no-report flags. Default is on when a
    single run is scored and off when --summary is requested, so
    benchmark aggregations stay fast.
  - --aggregate_report PATH writes a cohort PDF from the --summary CSV
    after scoring finishes (errors out if --summary is missing).

Runner:
  - process_many / _process_one_run gain a write_per_run_report kwarg
    that invokes the report module via a defensive
    _safe_write_per_run_report helper after each per-run CSV is
    materialised (including the reuse paths). The helper imports the
    report module lazily and swallows any import or runtime error so a
    matplotlib hiccup never blocks scoring.

Packaging:
  - pyproject bumps version to 1.0.1 and exposes the alphajudge-report
    console entry, which dispatches to per-run or aggregate mode based
    on whether the input is a directory or a CSV.
---
 pyproject.toml           |  1 +
 src/alphajudge/cli.py    | 64 ++++++++++++++++++++++++++++++----------
 src/alphajudge/runner.py | 22 ++++++++++++++
 3 files changed, 71 insertions(+), 16 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 35a6413e..93f7913a 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -49,6 +49,7 @@ test = [
 
 [project.scripts]
 alphajudge = "alphajudge.cli:main"
+alphajudge-report = "alphajudge.report:main_aggregate"
 
 [project.urls]
 Homepage = "https://github.com/KosinskiLab/AlphaJudge"
diff --git a/src/alphajudge/cli.py b/src/alphajudge/cli.py
index 0970c6cf..92800368 100644
--- a/src/alphajudge/cli.py
+++ b/src/alphajudge/cli.py
@@ -3,6 +3,7 @@
 import argparse
 import logging
 
+from .report import generate_aggregate_report
 from .runner import process_many
 
 
@@ -41,26 +42,57 @@ def main() -> None:
         default=1,
         help="Number of processes to use across run directories (0 = all available cores)",
     )
+    report_group = p.add_mutually_exclusive_group()
+    report_group.add_argument(
+        "--report",
+        dest="report",
+        action="store_true",
+        help="Write an RCSB-style report.pdf next to each per-run interfaces.csv "
+             "(default on for single-run scoring, off when --summary is used).",
+    )
+    report_group.add_argument(
+        "--no-report",
+        dest="report",
+        action="store_false",
+        help="Skip per-run report.pdf generation.",
+    )
+    p.set_defaults(report=None)
+    p.add_argument(
+        "--aggregate_report",
+        default=None,
+        help="If set, write an aggregate validation PDF to this path. "
+             "Reads the --summary CSV after scoring.",
+    )
     args = p.parse_args()
     logging.basicConfig(level=logging.INFO, format="%(levelname)s:%(message)s")
-    if args.paths:
-        process_many(
-            args.paths,
-            args.contact_thresh,
-            args.pae_filter,
-            args.models_to_analyse,
-            recursive=args.recursive,
-            summary_csv=args.summary,
-            cores=args.cores,
-            ipsae_pae_cutoff=args.ipsae_pae_cutoff,
-            force_recompute=args.force_recompute,
-            per_run_csv_name=args.per_run_csv_name,
-            skip_pae_png=args.skip_pae_png,
-            skip_biophysical_scores=args.skip_biophysical_scores,
-        )
-    else:
+    if not args.paths:
         p.error("Provide PATHS")
 
+    write_per_run_report = args.report
+    if write_per_run_report is None:
+        write_per_run_report = args.summary is None
+
+    process_many(
+        args.paths,
+        args.contact_thresh,
+        args.pae_filter,
+        args.models_to_analyse,
+        recursive=args.recursive,
+        summary_csv=args.summary,
+        cores=args.cores,
+        ipsae_pae_cutoff=args.ipsae_pae_cutoff,
+        force_recompute=args.force_recompute,
+        per_run_csv_name=args.per_run_csv_name,
+        skip_pae_png=args.skip_pae_png,
+        skip_biophysical_scores=args.skip_biophysical_scores,
+        write_per_run_report=write_per_run_report,
+    )
+
+    if args.aggregate_report:
+        if not args.summary:
+            p.error("--aggregate_report requires --summary")
+        generate_aggregate_report(args.summary, out_pdf=args.aggregate_report)
+
 
 if __name__ == "__main__":
     main()
diff --git a/src/alphajudge/runner.py b/src/alphajudge/runner.py
index a94f5af4..808fb3f5 100644
--- a/src/alphajudge/runner.py
+++ b/src/alphajudge/runner.py
@@ -218,6 +218,7 @@ def _process_one_run(
     per_run_csv_name: str,
     skip_pae_png: bool,
     skip_biophysical_scores: bool,
+    write_per_run_report: bool = False,
 ) -> tuple[str, list[dict]]:
     """
     Worker: process a single run dir (or reuse interfaces.csv) and optionally return rows for aggregation.
@@ -234,6 +235,8 @@ def _process_one_run(
             rows = _read_csv_rows(existing_csv)
             if rows:
                 logger.info(f"reused existing {existing_csv} for aggregation")
+                if write_per_run_report:
+                    _safe_write_per_run_report(d, csv_name=per_run_csv_name)
                 return (d_str, rows)
             logger.info(f"existing {existing_csv} is empty; recomputing")
         except Exception as e:
@@ -242,6 +245,8 @@ def _process_one_run(
     # If no summary requested but interfaces.csv exists, skip recompute
     if not want_summary and existing_csv.exists() and not force_recompute:
         logger.info(f"reused existing {existing_csv}; skipping recompute")
+        if write_per_run_report:
+            _safe_write_per_run_report(d, csv_name=per_run_csv_name)
         return (d_str, [])
 
     out_path = process(
@@ -255,6 +260,9 @@ def _process_one_run(
         skip_biophysical_scores=skip_biophysical_scores,
     )
 
+    if write_per_run_report and out_path is not None:
+        _safe_write_per_run_report(d, csv_name=per_run_csv_name)
+
     if want_summary and out_path is not None:
         try:
             return (d_str, _read_csv_rows(Path(out_path)))
@@ -264,6 +272,17 @@ def _process_one_run(
     return (d_str, [])
 
 
+def _safe_write_per_run_report(run_dir: Path, *, csv_name: str = "interfaces.csv") -> None:
+    """Generate report.pdf next to the per-run CSV, swallowing import/runtime errors."""
+    try:
+        # Import here so a missing matplotlib backend, etc., never blocks scoring.
+        from .report import generate_per_run_report
+
+        generate_per_run_report(run_dir, csv_name=csv_name)
+    except Exception as e:  # pragma: no cover - defensive
+        logger.warning(f"per-run report failed for {run_dir}: {e}")
+
+
 def process_many(
     paths: list[str],
     contact_thresh: float,
@@ -277,6 +296,7 @@ def process_many(
     per_run_csv_name: str = "interfaces.csv",
     skip_pae_png: bool = False,
     skip_biophysical_scores: bool = False,
+    write_per_run_report: bool = False,
 ) -> Path | None:
     """
     Process one or more directories. Optionally recurse into nested directories
@@ -349,6 +369,7 @@ def process_many(
                     per_run_csv_name,
                     skip_pae_png,
                     skip_biophysical_scores,
+                    write_per_run_report,
                 )
                 if summary_csv and rows:
                     aggregated_rows.extend(rows)
@@ -372,6 +393,7 @@ def process_many(
                     per_run_csv_name,
                     skip_pae_png,
                     skip_biophysical_scores,
+                    write_per_run_report,
                 )
                 for d in unique_run_dirs
             ]

From d95c3dfd50cd11e406b6b446b7bafc25b7977a04 Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Wed, 27 May 2026 15:13:31 +0200
Subject: [PATCH 04/15] Show per-interface table page for multimer runs

When a run has more than one chain-pair interface (any multimer
prediction), include a "Per-interface raw scores" page between the
overall quality slider panel and the PAE heatmap. Rows are sorted by
interface_meta_score descending so the strongest interfaces appear
first, making it easy to read off which subcomplex pairs are well
predicted and which are not.

For single-interface dimers nothing changes -- the page is skipped so
the report stays compact.

Also tightens the per-interface table layout: column widths give the
Interface and Residues headers enough room, the intro text is split
across two short lines instead of one wide one that clipped on A4, and
the table sits at y_top=0.78 with row_height=0.024 so 15+ rows fit
without crowding the footer.
---
 src/alphajudge/report.py | 51 ++++++++++++++++++++++++++++++++--------
 1 file changed, 41 insertions(+), 10 deletions(-)

diff --git a/src/alphajudge/report.py b/src/alphajudge/report.py
index e386d215..756d02aa 100644
--- a/src/alphajudge/report.py
+++ b/src/alphajudge/report.py
@@ -867,13 +867,22 @@ def _per_interface_page(
         number=section_no, title="Per-interface raw scores",
     )
 
-    intro_ax = fig.add_axes((0.10, 0.84, 0.80, 0.05))
+    intro_ax = fig.add_axes((0.10, 0.83, 0.80, 0.06))
     intro_ax.axis("off")
     intro_ax.text(
         0.0,
         1.0,
-        "Each row is one chain pair detected by AlphaJudge. The Meta column is the "
-        "averaged percentile across the 10 metascore features (higher is better).",
+        "Each row is one chain pair detected by AlphaJudge.",
+        fontsize=9,
+        ha="left",
+        va="top",
+        transform=intro_ax.transAxes,
+    )
+    intro_ax.text(
+        0.0,
+        0.55,
+        "The Meta column is the averaged percentile across the 10 metascore "
+        "features (higher is better).",
         fontsize=9,
         ha="left",
         va="top",
@@ -881,8 +890,13 @@ def _per_interface_page(
     )
 
     headers = ["Model", "Interface", "Residues", "Meta", "LIS", "ipSAE", "pDockQ2", "ipTM", "PAE", "Sc"]
+    sorted_rows = sorted(
+        rows,
+        key=lambda r: (_row_meta_score(r) if _row_meta_score(r) is not None else -1.0),
+        reverse=True,
+    )
     body: list[list[str]] = []
-    for r in rows:
+    for r in sorted_rows:
         body.append(
             [
                 _truncate(str(r.get("model_used") or ""), 26),
@@ -898,16 +912,16 @@ def _per_interface_page(
             ]
         )
 
-    col_fracs = [0.21, 0.09, 0.08, 0.08, 0.08, 0.09, 0.10, 0.07, 0.08, 0.12]
+    col_fracs = [0.18, 0.10, 0.10, 0.08, 0.08, 0.09, 0.10, 0.07, 0.08, 0.12]
     _draw_fixed_table(
         fig,
         x=0.07,
-        y_top=0.80,
+        y_top=0.78,
         w=0.86,
         headers=headers,
         rows=body,
         col_fracs=col_fracs,
-        row_height=0.026,
+        row_height=0.024,
     )
 
     _add_page_footer(fig, page_no=page_no, total=total, last=last)
@@ -1207,8 +1221,10 @@ def generate_per_run_report(
     other_models = [m for m in by_model if m and m != best_model]
 
     pae_png = _find_pae_png(run_dir, best_model)
+    unique_interfaces = {str(r.get("interface") or "") for r in rows}
+    show_interface_table = len(unique_interfaces) > 1
 
-    total = 2 + (1 if pae_png else 0) + len(other_models)
+    total = 2 + (1 if show_interface_table else 0) + (1 if pae_png else 0) + len(other_models)
 
     entry_id = _truncate(run_dir.name, 36)
     chains = _detect_chain_set(rows)
@@ -1268,21 +1284,36 @@ def generate_per_run_report(
             last=(page_no == total),
         )
 
+        next_section = 2
+        if show_interface_table:
+            page_no += 1
+            _per_interface_page(
+                pdf,
+                title=_REPORT_TITLE,
+                entry_id=entry_id,
+                section_no=str(next_section),
+                rows=rows,
+                page_no=page_no,
+                total=total,
+                last=(page_no == total),
+            )
+            next_section += 1
+
         if pae_png is not None:
             page_no += 1
             _pae_page(
                 pdf,
                 title=_REPORT_TITLE,
                 entry_id=entry_id,
-                section_no="2",
+                section_no=str(next_section),
                 image_path=pae_png,
                 model_label=best_model,
                 page_no=page_no,
                 total=total,
                 last=(page_no == total),
             )
+            next_section += 1
 
-        next_section = 3 if pae_png is not None else 2
         for m in other_models:
             m_rows = by_model[m]
             m_best = _best_row(m_rows) or m_rows[0]

From 37f893a6b13bfcfdb921598665a6a4acdcec48ab Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Wed, 27 May 2026 15:20:04 +0200
Subject: [PATCH 05/15] Emit per-interface slider pages and tighten cover
 wording

Per-interface pages:
  generate_per_run_report now produces one "Overall quality at a glance"
  page per detected interface, sorted by interface_meta_score
  descending, instead of only showing the best chain pair. For a 15-
  interface multimer that means 15 slider pages numbered 2.1 .. 2.15,
  preceded by the cohort overview table. Dimers with a single interface
  still get exactly one quality page numbered "1" (no sub-index) so
  their reports stay compact. Each page's pre-header now shows the
  model name + chain pair + residue count for that specific interface,
  not just the best one.

Cover info box:
  Replace "frozen benchmark deciles" with the more accurate "frozen
  benchmark distribution"; expand the explanation onto a fourth line so
  the pink box no longer crops the closing words.
---
 src/alphajudge/report.py | 73 +++++++++++++++++++++++++++-------------
 1 file changed, 49 insertions(+), 24 deletions(-)

diff --git a/src/alphajudge/report.py b/src/alphajudge/report.py
index 756d02aa..23582fb4 100644
--- a/src/alphajudge/report.py
+++ b/src/alphajudge/report.py
@@ -1221,10 +1221,23 @@ def generate_per_run_report(
     other_models = [m for m in by_model if m and m != best_model]
 
     pae_png = _find_pae_png(run_dir, best_model)
-    unique_interfaces = {str(r.get("interface") or "") for r in rows}
-    show_interface_table = len(unique_interfaces) > 1
-
-    total = 2 + (1 if show_interface_table else 0) + (1 if pae_png else 0) + len(other_models)
+    # Pick the best model's rows for the per-interface slider pages; sort by
+    # metascore descending so the strongest interface comes first.
+    best_model_rows = by_model.get(best_model, list(rows))
+    interface_rows = sorted(
+        best_model_rows,
+        key=lambda r: (_row_meta_score(r) if _row_meta_score(r) is not None else -1.0),
+        reverse=True,
+    )
+    show_interface_table = len(interface_rows) > 1
+
+    total = (
+        1  # cover
+        + (1 if show_interface_table else 0)  # overview table
+        + len(interface_rows)  # one slider page per interface
+        + (1 if pae_png else 0)  # PAE heatmap
+        + len(other_models)  # non-best-model appendix
+    )
 
     entry_id = _truncate(run_dir.name, 36)
     chains = _detect_chain_set(rows)
@@ -1243,8 +1256,9 @@ def generate_per_run_report(
     ]
     info_lines = [
         "AlphaJudge interface validation report.",
-        "Each metric is converted to its archive percentile using the frozen benchmark",
-        "deciles; the overall meta score is the unweighted mean over available features.",
+        "Each metric is converted to its archive percentile against the frozen",
+        "benchmark distribution; the overall meta score is the unweighted mean over",
+        "available features.",
     ]
     software_lines: list[tuple[str, str]] = [
         ("Reference distribution", _BENCHMARK_TAG),
@@ -1267,24 +1281,7 @@ def generate_per_run_report(
             total=total,
         )
 
-        page_no += 1
-        _quality_page(
-            pdf,
-            title=_REPORT_TITLE,
-            entry_id=entry_id,
-            section_no="1",
-            section_title="Overall quality at a glance",
-            pre_lines=[
-                f"Best model: {best_model}",
-                f"Best interface: {best.get('interface', '?')}    Residues at interface: {best.get('interface_num_intf_residues', '?')}",
-            ],
-            row=best,
-            page_no=page_no,
-            total=total,
-            last=(page_no == total),
-        )
-
-        next_section = 2
+        next_section = 1
         if show_interface_table:
             page_no += 1
             _per_interface_page(
@@ -1299,6 +1296,34 @@ def generate_per_run_report(
             )
             next_section += 1
 
+        quality_section_no = next_section
+        for i, row in enumerate(interface_rows):
+            page_no += 1
+            iface_label = str(row.get("interface") or "?")
+            n_res = row.get("interface_num_intf_residues") or "?"
+            if show_interface_table:
+                section_title = f"Interface {iface_label}"
+                section_no = f"{quality_section_no}.{i + 1}"
+            else:
+                section_title = "Overall quality at a glance"
+                section_no = str(quality_section_no)
+            _quality_page(
+                pdf,
+                title=_REPORT_TITLE,
+                entry_id=entry_id,
+                section_no=section_no,
+                section_title=section_title,
+                pre_lines=[
+                    f"Model: {row.get('model_used', best_model)}",
+                    f"Chain pair: {iface_label}    Residues at interface: {n_res}",
+                ],
+                row=row,
+                page_no=page_no,
+                total=total,
+                last=(page_no == total),
+            )
+        next_section = quality_section_no + 1
+
         if pae_png is not None:
             page_no += 1
             _pae_page(

From e63cecb836fdbea68baddad980cdddc7885ccd13 Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Wed, 27 May 2026 15:29:55 +0200
Subject: [PATCH 06/15] Switch aggregate report to per-interface statistics
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The cohort cover and per-page summaries now treat each chain-pair
interface as the unit of analysis, not the predicted complex. Concretely
generate_aggregate_report no longer groups rows by complex and keeps a
"best per complex" entry; it ranks every scorable interface row
directly. Consequences:

  - The histogram, min/median/mean/max, ≥0.5 and ≥0.7 counters all run
    over interfaces. A 9-chain multimer with 15 detected interfaces
    contributes 15 data points; a dimer contributes 1. Mixing the two
    in one cohort no longer under-represents multimers.
  - The "Top N" table is now "Top N interfaces by meta score" and uses
    a "complex · pair" label so multimer rows show which chain pair
    they refer to.
  - Each per-page slider panel is now an interface page, not a complex
    page (renamed _complex_summary_page -> _interface_summary_page).
    The header subtitle leads with the interface label and shows
    "Rank K of N" against the global interface ranking.
  - Backend counts in the cover meta block stay per-complex so they are
    not double-counted across a multimer's interfaces.

Cover sub-title says "N interfaces across M complexes" so users see
both axes at a glance. test/test_report.py is updated to match the new
page count (cover + one page per scorable interface row).
---
 src/alphajudge/report.py | 103 +++++++++++++++++++++------------------
 test/test_report.py      |   8 +--
 2 files changed, 60 insertions(+), 51 deletions(-)

diff --git a/src/alphajudge/report.py b/src/alphajudge/report.py
index 23582fb4..82325359 100644
--- a/src/alphajudge/report.py
+++ b/src/alphajudge/report.py
@@ -971,7 +971,7 @@ def _aggregate_cover_page(
     *,
     summary_csv: Path,
     n_complexes: int,
-    n_rows: int,
+    n_interfaces: int,
     scores: Sequence[float],
     top_rows: Sequence[tuple[str, float, Mapping[str, Any]]],
     backends: Mapping[str, int],
@@ -1001,7 +1001,7 @@ def _aggregate_cover_page(
     sub_ax.text(
         0.5,
         0.5,
-        f"Aggregate report – {n_complexes} complexes",
+        f"Aggregate report – {n_interfaces} interfaces across {n_complexes} complexes",
         ha="center",
         va="center",
         fontsize=11,
@@ -1013,7 +1013,7 @@ def _aggregate_cover_page(
         ("Source", _shorten_path(str(summary_csv), max_len=58)),
         ("Date", datetime.now().strftime("%Y-%m-%d %H:%M")),
         ("Complexes", str(n_complexes)),
-        ("Interface rows", str(n_rows)),
+        ("Interfaces", str(n_interfaces)),
     ]
     if backends:
         meta.append(("Backends", ", ".join(f"{k}={v}" for k, v in backends.items())))
@@ -1030,8 +1030,8 @@ def _aggregate_cover_page(
     if scores:
         hist_ax.hist(scores, bins=24, range=(0.0, 1.0), color="#5688c7", edgecolor="white")
     hist_ax.set_xlim(0.0, 1.0)
-    hist_ax.set_xlabel("Interface meta score (best per complex)", fontsize=9, labelpad=2)
-    hist_ax.set_ylabel("Complexes", fontsize=9)
+    hist_ax.set_xlabel("Interface meta score (one point per interface)", fontsize=9, labelpad=2)
+    hist_ax.set_ylabel("Interfaces", fontsize=9)
     hist_ax.set_title("Distribution across cohort", fontsize=10, loc="left")
     hist_ax.tick_params(labelsize=8)
 
@@ -1057,20 +1057,20 @@ def _aggregate_cover_page(
     title2_ax.text(
         0.5,
         0.5,
-        f"Top {len(top_rows)} complexes by interface meta score",
+        f"Top {len(top_rows)} interfaces by meta score",
         ha="center",
         va="center",
         fontsize=11,
         fontweight="bold",
         transform=title2_ax.transAxes,
     )
-    headers = ["Rank", "Complex", "Meta", "LIS", "ipSAE", "ipTM", "PAE", "Sc"]
+    headers = ["Rank", "Complex / interface", "Meta", "LIS", "ipSAE", "ipTM", "PAE", "Sc"]
     body: list[list[str]] = []
     for i, (name, score, row) in enumerate(top_rows, start=1):
         body.append(
             [
                 str(i),
-                _truncate(name, 28),
+                _truncate(name, 34),
                 _format_raw(score),
                 _format_raw(_safe_float(row.get("interface_LIS"))),
                 _format_raw(_safe_float(row.get("interface_ipSAE"))),
@@ -1079,7 +1079,7 @@ def _aggregate_cover_page(
                 _format_raw(_safe_float(row.get("interface_sc"))),
             ]
         )
-    col_fracs = [0.07, 0.30, 0.10, 0.10, 0.10, 0.10, 0.10, 0.13]
+    col_fracs = [0.07, 0.34, 0.09, 0.09, 0.10, 0.09, 0.10, 0.12]
     _draw_fixed_table(
         fig,
         x=0.07,
@@ -1096,21 +1096,22 @@ def _aggregate_cover_page(
     plt.close(fig)
 
 
-def _complex_summary_page(
+def _interface_summary_page(
     pdf: PdfPages,
     *,
     complex_name: str,
-    rows: Sequence[Mapping[str, Any]],
+    interface_label: str,
+    row: Mapping[str, Any],
     cohort_position: tuple[int, int] | None,
     page_no: int,
     total: int,
     last: bool,
 ) -> None:
-    best = _best_row(rows) or rows[0]
     fig = _new_figure()
+    entry = f"{_truncate(complex_name, 26)} / {interface_label}"
     _add_page_header(
         fig, page_no=page_no, total=total,
-        title=_REPORT_TITLE, entry=_truncate(complex_name, 40),
+        title=_REPORT_TITLE, entry=_truncate(entry, 40),
     )
 
     title_ax = fig.add_axes((0.07, 0.91, 0.86, 0.05))
@@ -1118,7 +1119,7 @@ def _complex_summary_page(
     title_ax.text(
         0.5,
         0.5,
-        complex_name,
+        _truncate(complex_name, 60),
         ha="center",
         va="center",
         fontsize=17,
@@ -1129,12 +1130,12 @@ def _complex_summary_page(
     sub_ax = fig.add_axes((0.07, 0.875, 0.86, 0.025))
     sub_ax.axis("off")
     bits = [
-        f"Model {best.get('model_used', '?')}",
-        f"Interface {best.get('interface', '?')}",
+        f"Interface {interface_label}",
+        f"Model {row.get('model_used', '?')}",
     ]
     if cohort_position is not None:
         bits.append(f"Rank {cohort_position[0]} of {cohort_position[1]}")
-    n_res = best.get("interface_num_intf_residues")
+    n_res = row.get("interface_num_intf_residues")
     if n_res:
         bits.append(f"{n_res} interface residues")
     sub_ax.text(0.5, 0.5, "  •  ".join(bits), ha="center", va="center", fontsize=10, color="#222", transform=sub_ax.transAxes)
@@ -1144,14 +1145,14 @@ def _complex_summary_page(
         number="1", title="Overall quality at a glance",
     )
 
-    _draw_slider_panel(fig, top=0.79, height=0.62, row=best, include_overall=True)
+    _draw_slider_panel(fig, top=0.79, height=0.62, row=row, include_overall=True)
 
     note_ax = fig.add_axes((0.10, 0.07, 0.80, 0.06))
     note_ax.axis("off")
     note_ax.text(
         0.5,
         1.0,
-        "Black marker shows this complex's percentile rank against the AlphaJudge benchmark "
+        "Black marker shows this interface's percentile rank against the AlphaJudge benchmark "
         "(higher = better).",
         ha="center",
         va="top",
@@ -1370,7 +1371,11 @@ def generate_aggregate_report(
     top_n: int = 10,
     max_complexes: int | None = None,
 ) -> Path | None:
-    """Build a multi-page aggregate validation PDF from a merged interfaces CSV."""
+    """Build a multi-page aggregate validation PDF from a merged interfaces CSV.
+
+    Statistics are computed **per interface** (one data point per chain pair
+    in the merged CSV). A multimer with 15 interfaces contributes 15 points.
+    """
 
     _setup_rcparams()
 
@@ -1383,34 +1388,38 @@ def generate_aggregate_report(
         logger.warning("empty summary CSV: %s", summary_csv)
         return None
 
-    grouped = _group_complex_rows(rows)
-    if not grouped:
-        logger.warning("no grouping key (jobs/pair) in %s", summary_csv)
-        return None
-
-    ranked: list[tuple[str, float, Mapping[str, Any]]] = []
-    for name, complex_rows in grouped.items():
-        best = _best_row(complex_rows)
-        if best is None:
+    # One entry per scorable interface row.
+    ranked: list[tuple[str, str, str, float, Mapping[str, Any]]] = []
+    for r in rows:
+        cname = str(r.get("jobs") or r.get("pair") or r.get("complex") or "")
+        iface = str(r.get("interface") or "")
+        if not cname:
             continue
-        score = _row_meta_score(best)
+        score = _row_meta_score(r)
         if score is None:
             continue
-        ranked.append((name, score, best))
-    ranked.sort(key=lambda t: t[1], reverse=True)
+        label = f"{cname} · {iface}" if iface else cname
+        ranked.append((label, cname, iface, score, r))
+    if not ranked:
+        logger.warning("no scorable interface rows in %s", summary_csv)
+        return None
+    ranked.sort(key=lambda t: t[3], reverse=True)
 
-    top_rows = ranked[:top_n]
-    if max_complexes is not None:
-        ranked_per_page = ranked[:max_complexes]
-    else:
-        ranked_per_page = ranked
+    top_rows = [(label, score, r) for label, _, _, score, r in ranked[:top_n]]
+    ranked_per_page = ranked if max_complexes is None else ranked[:max_complexes]
 
+    # Backends counted per complex (so a multimer doesn't multi-count).
+    seen_backend: dict[str, str] = {}
+    for _label, cname, _iface, _score, r in ranked:
+        if cname not in seen_backend:
+            seen_backend[cname] = _detect_backend([r])
     backends: dict[str, int] = {}
-    for name, complex_rows in grouped.items():
-        b = _detect_backend(complex_rows)
+    for b in seen_backend.values():
         backends[b] = backends.get(b, 0) + 1
 
-    scores = [s for (_, s, _) in ranked]
+    scores = [s for _, _, _, s, _ in ranked]
+    n_complexes = len(seen_backend)
+    n_interfaces = len(ranked)
     total = 1 + len(ranked_per_page)
 
     out_pdf = Path(out_pdf)
@@ -1419,20 +1428,20 @@ def generate_aggregate_report(
         _aggregate_cover_page(
             pdf,
             summary_csv=summary_csv,
-            n_complexes=len(grouped),
-            n_rows=len(rows),
+            n_complexes=n_complexes,
+            n_interfaces=n_interfaces,
             scores=scores,
             top_rows=top_rows,
             backends=backends,
             page_no=1,
             total=total,
         )
-        for rank, (name, _score, _best) in enumerate(ranked_per_page, start=1):
-            complex_rows = grouped[name]
-            _complex_summary_page(
+        for rank, (_label, cname, iface, _score, r) in enumerate(ranked_per_page, start=1):
+            _interface_summary_page(
                 pdf,
-                complex_name=name,
-                rows=complex_rows,
+                complex_name=cname,
+                interface_label=iface or "?",
+                row=r,
                 cohort_position=(rank, len(ranked_per_page)),
                 page_no=1 + rank,
                 total=total,
diff --git a/test/test_report.py b/test/test_report.py
index d4defb62..8015100d 100644
--- a/test/test_report.py
+++ b/test/test_report.py
@@ -86,7 +86,7 @@ def test_per_run_report_returns_none_on_missing_csv(tmp_path: Path) -> None:
     assert generate_per_run_report(tmp_path) is None
 
 
-def test_aggregate_report_writes_cover_plus_one_page_per_complex(tmp_path: Path) -> None:
+def test_aggregate_report_writes_cover_plus_one_page_per_interface(tmp_path: Path) -> None:
     rows = [
         dict(_BASE_ROW),
         {**_BASE_ROW, "jobs": "PROT_C_PROT_D",
@@ -100,8 +100,8 @@ def test_aggregate_report_writes_cover_plus_one_page_per_complex(tmp_path: Path)
     result = generate_aggregate_report(summary, out_pdf=out)
     assert result == out
     assert out.exists() and out.stat().st_size > 0
-    # cover + 2 complex pages
-    assert _pdf_page_count(out) == 3
+    # cover + one page per scorable interface row (3 here)
+    assert _pdf_page_count(out) == 4
 
 
 def test_aggregate_report_handles_missing_meta_score_via_recompute(tmp_path: Path) -> None:
@@ -119,4 +119,4 @@ def test_aggregate_report_handles_missing_meta_score_via_recompute(tmp_path: Pat
     result = generate_aggregate_report(summary, out_pdf=out)
     assert result is not None
     assert out.exists()
-    assert _pdf_page_count(out) == 3  # cover + 2 complexes
+    assert _pdf_page_count(out) == 3  # cover + 2 interfaces

From f76317e25366dedd35785bc64ab4a8d097a53a4d Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Wed, 27 May 2026 15:34:04 +0200
Subject: [PATCH 07/15] Drop per-page footer boilerplate from validation
 reports

Two pieces of repeated text added unnecessary clutter to every page:

  - The "Percentile ranks are computed against the AlphaJudge
    benchmark distribution; higher is better for every metric
    (sign-flipped where needed)." note at the bottom of every quality
    page. The slider's "Worse <- -> Better" axis already conveys this.

  - The "AlphaJudge" left-side label and the "Continued on next page..."
    middle text in the page footer. The thin footer rule plus the page
    number on the right are enough.

After this change each page has a header rule (Page N / title / entry
id) and a footer with just the rule and "N / total" page counter.
---
 src/alphajudge/report.py | 38 +-------------------------------------
 1 file changed, 1 insertion(+), 37 deletions(-)

diff --git a/src/alphajudge/report.py b/src/alphajudge/report.py
index 82325359..010d7a4e 100644
--- a/src/alphajudge/report.py
+++ b/src/alphajudge/report.py
@@ -8,7 +8,7 @@
   marker for the entry's archive percentile;
 * a numbered "Overall quality at a glance" page with a metric/value table;
 * a page header rule with title + page number + entry id, and a
-  bottom rule with a "Continued on next page" note.
+  thin bottom rule with the page number.
 
 Two entry points:
 
@@ -241,18 +241,6 @@ def _add_page_footer(fig: plt.Figure, *, page_no: int, total: int, last: bool) -
     rule.axhline(0.5, color=_HEADER_RULE, linewidth=0.6)
     ax = fig.add_axes((0.07, 0.018, 0.86, 0.018))
     ax.axis("off")
-    if not last and page_no < total:
-        ax.text(
-            0.5,
-            0.5,
-            "Continued on next page…",
-            ha="center",
-            va="center",
-            fontsize=8,
-            color="#666",
-            style="italic",
-            transform=ax.transAxes,
-        )
     ax.text(
         1.0,
         0.5,
@@ -263,16 +251,6 @@ def _add_page_footer(fig: plt.Figure, *, page_no: int, total: int, last: bool) -
         color="#555",
         transform=ax.transAxes,
     )
-    ax.text(
-        0.0,
-        0.5,
-        "AlphaJudge",
-        ha="left",
-        va="center",
-        fontsize=8,
-        color="#555",
-        transform=ax.transAxes,
-    )
 
 
 def _draw_info_box(fig: plt.Figure, *, x: float, y: float, w: float, h: float, lines: Sequence[str]) -> None:
@@ -830,20 +808,6 @@ def _quality_page(
 
     _draw_slider_panel(fig, top=0.76, height=0.60, row=row, include_overall=True)
 
-    explanation_ax = fig.add_axes((0.10, 0.06, 0.80, 0.06))
-    explanation_ax.axis("off")
-    explanation_ax.text(
-        0.5,
-        0.9,
-        "Percentile ranks are computed against the AlphaJudge benchmark distribution; "
-        "higher is better for every metric (sign-flipped where needed).",
-        ha="center",
-        va="top",
-        fontsize=9,
-        color="#555",
-        transform=explanation_ax.transAxes,
-    )
-
     _add_page_footer(fig, page_no=page_no, total=total, last=last)
     pdf.savefig(fig)
     plt.close(fig)

From a41276995fcb957968164249e93d85cdf507ce3f Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Wed, 27 May 2026 15:36:45 +0200
Subject: [PATCH 08/15] Drop "Page N" from header (page number already in
 footer)

The page header carried "Page N" on the left, "Title" in the middle,
and "entry id" on the right. The footer already shows "N / total" at
the bottom right, so the header repeat was redundant.

Header now reads "Title  ...  entry id" only. Module docstring updated.
---
 src/alphajudge/report.py | 7 +++----
 1 file changed, 3 insertions(+), 4 deletions(-)

diff --git a/src/alphajudge/report.py b/src/alphajudge/report.py
index 010d7a4e..8d1ae692 100644
--- a/src/alphajudge/report.py
+++ b/src/alphajudge/report.py
@@ -7,8 +7,8 @@
 * a smooth red -> yellow -> green percentile slider with a single black
   marker for the entry's archive percentile;
 * a numbered "Overall quality at a glance" page with a metric/value table;
-* a page header rule with title + page number + entry id, and a
-  thin bottom rule with the page number.
+* a page header rule with title + entry id, and a thin bottom rule
+  with the page number.
 
 Two entry points:
 
@@ -227,8 +227,7 @@ def _new_figure() -> plt.Figure:
 def _add_page_header(fig: plt.Figure, *, page_no: int, total: int, title: str, entry: str) -> None:
     ax = fig.add_axes((0.07, 0.965, 0.86, 0.018))
     ax.axis("off")
-    ax.text(0.0, 0.5, f"Page {page_no}", fontsize=8, color="#333", va="center", transform=ax.transAxes)
-    ax.text(0.5, 0.5, title, fontsize=8, color="#333", va="center", ha="center", transform=ax.transAxes)
+    ax.text(0.0, 0.5, title, fontsize=8, color="#333", va="center", transform=ax.transAxes)
     ax.text(1.0, 0.5, entry, fontsize=8, color="#333", va="center", ha="right", transform=ax.transAxes)
     rule = fig.add_axes((0.07, 0.957, 0.86, 0.003))
     rule.axis("off")

From edd466c437c8234d981322af57050658dd3fefcb Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Wed, 27 May 2026 15:41:55 +0200
Subject: [PATCH 09/15] Document --report and --aggregate_report in README

Adds the new report flags to the CLI synopsis, the option list, the
output description, and an example invocation; documents the
alphajudge-report console entry that exposes the per-run and aggregate
modes outside the scoring pipeline.
---
 README.md | 20 +++++++++++++++++++-
 1 file changed, 19 insertions(+), 1 deletion(-)

diff --git a/README.md b/README.md
index eb1108fa..4e3e202b 100644
--- a/README.md
+++ b/README.md
@@ -82,7 +82,9 @@ alphajudge PATH [PATH ...] \
   --ipsae_pae_cutoff 10.0 \
   [-r|--recursive] \
   [-o|--summary SUMMARY.csv] \
-  [--cores]
+  [--cores] \
+  [--report | --no-report] \
+  [--aggregate_report AGGREGATE.pdf]
 ```
 
 - **PATH**: One or more run directories or roots to search
@@ -93,11 +95,22 @@ alphajudge PATH [PATH ...] \
 - **-r / --recursive**: Recursively discover runs under each PATH
 - **-o / --summary**: Write an aggregated CSV across all processed runs
 - **--cores**: Number of processes to use across run directories (0 = all available cores)
+- **--report / --no-report**: Write an RCSB-style `report.pdf` next to each per-run `interfaces.csv`. Default is on for single-run scoring and off when `--summary` is used, so benchmark aggregations stay fast.
+- **--aggregate_report AGGREGATE.pdf**: After scoring, build a multi-page validation PDF from the `--summary` CSV with one slider page per interface ranked by meta score (requires `--summary`).
 
 Outputs:
 - Always writes `interfaces.csv` inside each processed run directory.
 - For each processed model, also writes a PAE heatmap PNG `pae_<model>.png` next to `interfaces.csv`.
+- If `--report` is on, also writes `report.pdf` next to `interfaces.csv` -- an RCSB-style validation report with a percentile slider panel for every detected interface.
 - If `--summary` is provided, also writes a union-header CSV at the given path containing rows from all runs.
+- If `--aggregate_report` is provided, also writes a multi-page PDF with one slider page per interface across the whole cohort, plus a cover with the meta-score histogram, summary statistics, and a top-N interfaces table.
+
+A separate `alphajudge-report` console entry is also available; it dispatches to per-run mode when given a run directory and to aggregate mode when given a summary CSV:
+
+```bash
+alphajudge-report path/to/run_dir --out-pdf path/to/report.pdf
+alphajudge-report path/to/summary.csv --out-pdf path/to/aggregate.pdf
+```
 
 Examples
 
@@ -118,6 +131,11 @@ alphajudge test_data/af2/pos_dimers/Q13148+Q92900 \
 
 # Recursively discover runs under roots and write a combined summary
 alphajudge test_data/af2/pos_dimers test_data/af3/pos_dimers -r -o interfaces_summary.csv
+
+# Score a cohort and emit a cohort-wide validation PDF (one slider page per interface)
+alphajudge test_data/af2/pos_dimers -r \
+  -o interfaces_summary.csv \
+  --aggregate_report aggregate_report.pdf
 ```
 
 ---

From 012e28ec0bfb3bb8c22550714463355361fb98b1 Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Wed, 27 May 2026 15:57:32 +0200
Subject: [PATCH 10/15] Clarify that report generation covers all supported
 backends

After rebasing report_percentiles onto the Boltz-2 work, note explicitly
that --report and --aggregate_report flow through the same scoring path
for AF2, AF3, and Boltz-2 runs, and broaden the cohort-report example
to cover a mixed-backend root.
---
 README.md | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/README.md b/README.md
index 4e3e202b..62352216 100644
--- a/README.md
+++ b/README.md
@@ -105,6 +105,8 @@ Outputs:
 - If `--summary` is provided, also writes a union-header CSV at the given path containing rows from all runs.
 - If `--aggregate_report` is provided, also writes a multi-page PDF with one slider page per interface across the whole cohort, plus a cover with the meta-score histogram, summary statistics, and a top-N interfaces table.
 
+Report generation is backend-agnostic: AF2, AF3, and Boltz-2 runs all flow through the same scoring path, so `--report` and `--aggregate_report` work identically for any mix of supported predictions in one cohort. Multimers contribute one slider page per detected chain pair; dimers contribute one.
+
 A separate `alphajudge-report` console entry is also available; it dispatches to per-run mode when given a run directory and to aggregate mode when given a summary CSV:
 
 ```bash
@@ -132,8 +134,9 @@ alphajudge test_data/af2/pos_dimers/Q13148+Q92900 \
 # Recursively discover runs under roots and write a combined summary
 alphajudge test_data/af2/pos_dimers test_data/af3/pos_dimers -r -o interfaces_summary.csv
 
-# Score a cohort and emit a cohort-wide validation PDF (one slider page per interface)
-alphajudge test_data/af2/pos_dimers -r \
+# Score a cohort (any mix of AF2 / AF3 / Boltz-2 run dirs) and emit a cohort-wide
+# validation PDF with one slider page per detected interface
+alphajudge test_data/af2/pos_dimers test_data/af3/pos_dimers -r \
   -o interfaces_summary.csv \
   --aggregate_report aggregate_report.pdf
 ```

From 81a7f8729b2a9969499c0761209e9fcb03f6dc3e Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Thu, 28 May 2026 09:30:23 +0200
Subject: [PATCH 11/15] Guard --aggregate_report against a stale summary CSV

process_many returns None whenever it does not actually write the
summary (no paths, no runnable dirs, all workers produced no rows).
The CLI previously ignored that return value, so if --aggregate_report
pointed at a path that already had a CSV from a previous invocation,
generate_aggregate_report would silently consume that stale file and
emit a PDF for the wrong cohort.

Capture the returned summary path and fail loudly via p.error when it
is None, instead of building a report from data this invocation did
not produce.
---
 src/alphajudge/cli.py | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/src/alphajudge/cli.py b/src/alphajudge/cli.py
index 92800368..124fd1f6 100644
--- a/src/alphajudge/cli.py
+++ b/src/alphajudge/cli.py
@@ -72,7 +72,7 @@ def main() -> None:
     if write_per_run_report is None:
         write_per_run_report = args.summary is None
 
-    process_many(
+    summary_path = process_many(
         args.paths,
         args.contact_thresh,
         args.pae_filter,
@@ -91,7 +91,13 @@ def main() -> None:
     if args.aggregate_report:
         if not args.summary:
             p.error("--aggregate_report requires --summary")
-        generate_aggregate_report(args.summary, out_pdf=args.aggregate_report)
+        if summary_path is None:
+            p.error(
+                f"--aggregate_report requested but no summary was written to "
+                f"{args.summary}; refusing to build a report from a possibly "
+                "stale CSV"
+            )
+        generate_aggregate_report(summary_path, out_pdf=args.aggregate_report)
 
 
 if __name__ == "__main__":

From ffa0dccc2356886aee41780b12d1ddd433e8cd29 Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Thu, 28 May 2026 09:46:45 +0200
Subject: [PATCH 12/15] Make report visuals match wwPDB / RCSB more faithfully

The previous green RdYlGn gradient with boxed % and Value columns made
the page look like a dashboard. Switch to the wwPDB look:

  - Red -> pale center -> blue percentile bars (LinearSegmentedColormap),
    deliberately thin (bar_height ~0.011 of page).
  - Drop the explicit % column; percentile is conveyed by marker
    position. Three columns only: Metric | Percentile Ranks | Value.
  - Single small black marker per row, plus a thin black polyline
    connecting valid percentiles down the chart, exactly as on the
    wwPDB "Overall quality at a glance" page.
  - "Worse" / "Better" italic labels directly under the bars and a
    marker-glyph legend, in the wwPDB position.

Page chrome:

  - Cover has no running header. It leads with a small text PDB
    wordmark, the report title, and a blue circled-i icon, matching
    the RCSB cover.
  - Pages 2+ get a single-rule running header: "Page N | Title | entry".
  - Footer is just a small wordmark, no page-number rule (the running
    header already carries the page label).
  - Pink info box is square-cornered and uses wwPDB red.
  - Section headings render number + title at 17pt with a tight gap;
    the optional info icon is now off by default so it never overlaps
    chain-pair labels like "Interface B_C".

Typography:

  - rcParams switched to a Computer-Modern-style serif stack
    (CMU Serif / Latin Modern / STIXGeneral / DejaVu Serif fallback),
    mathtext "cm", base font 10pt, PDF font type 42 so text stays
    searchable in Acrobat.

The slider primitive now exposes a draw_marker switch so the per-row
bar is clean and the marker polyline is overlaid in a single axes,
which avoids axis clipping for off-bar marker rectangles.
---
 src/alphajudge/report.py | 769 +++++++++++++++++++++++++--------------
 1 file changed, 499 insertions(+), 270 deletions(-)

diff --git a/src/alphajudge/report.py b/src/alphajudge/report.py
index 8d1ae692..a2cf12fa 100644
--- a/src/alphajudge/report.py
+++ b/src/alphajudge/report.py
@@ -34,7 +34,8 @@
 import matplotlib.pyplot as plt
 import numpy as np
 from matplotlib.backends.backend_pdf import PdfPages
-from matplotlib.patches import FancyBboxPatch, Rectangle
+from matplotlib.colors import LinearSegmentedColormap
+from matplotlib.patches import Circle, FancyBboxPatch, Rectangle
 
 from .meta_score import (
     BENCHMARK_QUANTILES,
@@ -48,11 +49,25 @@
 logger = logging.getLogger(__name__)
 
 _A4 = (8.27, 11.69)
-_SLIDER_CMAP = "RdYlGn"
-_INFO_BG = "#fbe5e5"
-_INFO_EDGE = "#a83232"
-_HEADER_RULE = "#3a3a3a"
-_TABLE_RULE = "#404040"
+
+# RCSB/wwPDB percentile graphic: red -> pale center -> blue.
+# Do not use RdYlGn here; the wwPDB report uses a red/blue percentile bar.
+_SLIDER_CMAP = LinearSegmentedColormap.from_list(
+    "wwpdb_percentile",
+    [
+        (0.00, "#ff1a1a"),
+        (0.35, "#ffd1d1"),
+        (0.50, "#f4f0f0"),
+        (0.65, "#d8d8ff"),
+        (1.00, "#171cff"),
+    ],
+)
+
+_INFO_BG = "#ffb3b3"
+_INFO_EDGE = "#ff0000"
+_HEADER_RULE = "#303030"
+_TABLE_RULE = "#202020"
+_RCSB_BLUE = "#0000ff"
 
 _REPORT_TITLE = "AlphaJudge Interface Validation Report"
 _BENCHMARK_TAG = "benchmark_26 (final_sync_20260523, n=7,756 AF2/AF3 rows)"
@@ -82,18 +97,33 @@
 # ---------------------------------------------------------------------------
 
 def _setup_rcparams() -> None:
+    """Use a Computer-Modern-like serif PDF look, close to wwPDB reports."""
     rcparams = {
         "font.family": "serif",
-        "font.serif": ["DejaVu Serif", "Times New Roman", "Times"],
-        "mathtext.fontset": "dejavuserif",
-        "axes.titlesize": 11,
+        "font.serif": [
+            "CMU Serif",
+            "Computer Modern Roman",
+            "Latin Modern Roman",
+            "STIXGeneral",
+            "DejaVu Serif",
+            "Times New Roman",
+            "Times",
+        ],
+        "mathtext.fontset": "cm",
+        "font.size": 10,
+        "axes.titlesize": 10,
         "axes.labelsize": 9,
         "axes.spines.top": False,
         "axes.spines.right": False,
         "xtick.labelsize": 8,
         "ytick.labelsize": 8,
-        "axes.edgecolor": "#222222",
-        "savefig.dpi": 200,
+        "axes.edgecolor": "#202020",
+        "axes.linewidth": 0.6,
+        "savefig.dpi": 300,
+        # Keep text as searchable TrueType text in the PDF.
+        "pdf.fonttype": 42,
+        "ps.fonttype": 42,
+        "axes.unicode_minus": False,
     }
     matplotlib.rcParams.update(rcparams)
 
@@ -224,55 +254,164 @@ def _new_figure() -> plt.Figure:
     return plt.figure(figsize=_A4, facecolor="white")
 
 
-def _add_page_header(fig: plt.Figure, *, page_no: int, total: int, title: str, entry: str) -> None:
-    ax = fig.add_axes((0.07, 0.965, 0.86, 0.018))
+def _draw_info_icon(fig: plt.Figure, *, x: float, y: float, r: float = 0.010) -> None:
+    """Small blue circled 'i' like the wwPDB validation report."""
+    ax = fig.add_axes((x - r, y - r, 2 * r, 2 * r))
+    ax.set_xlim(0, 1)
+    ax.set_ylim(0, 1)
+    ax.set_aspect("equal")
     ax.axis("off")
-    ax.text(0.0, 0.5, title, fontsize=8, color="#333", va="center", transform=ax.transAxes)
-    ax.text(1.0, 0.5, entry, fontsize=8, color="#333", va="center", ha="right", transform=ax.transAxes)
-    rule = fig.add_axes((0.07, 0.957, 0.86, 0.003))
-    rule.axis("off")
-    rule.axhline(0.5, color=_HEADER_RULE, linewidth=0.8)
+    ax.add_patch(
+        Circle(
+            (0.5, 0.5),
+            0.47,
+            facecolor="white",
+            edgecolor=_RCSB_BLUE,
+            linewidth=1.0,
+            transform=ax.transAxes,
+        )
+    )
+    ax.text(
+        0.5,
+        0.48,
+        "i",
+        ha="center",
+        va="center",
+        fontsize=8,
+        color=_RCSB_BLUE,
+        fontweight="bold",
+        transform=ax.transAxes,
+    )
 
 
-def _add_page_footer(fig: plt.Figure, *, page_no: int, total: int, last: bool) -> None:
-    rule = fig.add_axes((0.07, 0.038, 0.86, 0.003))
-    rule.axis("off")
-    rule.axhline(0.5, color=_HEADER_RULE, linewidth=0.6)
-    ax = fig.add_axes((0.07, 0.018, 0.86, 0.018))
+def _draw_wordmark(
+    fig: plt.Figure,
+    *,
+    x: float = 0.5,
+    y: float = 0.93,
+    w: float = 0.20,
+    h: float = 0.060,
+    scale: float = 1.0,
+) -> None:
+    """A lightweight text stand-in for the small wwPDB/PDB wordmark.
+
+    Use an approved logo image here if you have one; this avoids bundling any
+    external logo asset while still matching the spatial rhythm of the report.
+    """
+    ax = fig.add_axes((x - w / 2, y - h / 2, w, h))
+    ax.set_xlim(0, 1)
+    ax.set_ylim(0, 1)
     ax.axis("off")
     ax.text(
-        1.0,
         0.5,
-        f"{page_no} / {total}",
+        0.88,
+        "W O R L D W I D E",
+        ha="center",
+        va="center",
+        fontsize=6.5 * scale,
+        fontweight="bold",
+        color="#202020",
+        transform=ax.transAxes,
+    )
+    ax.text(
+        0.5,
+        0.50,
+        "PDB",
+        ha="center",
+        va="center",
+        fontsize=24 * scale,
+        fontweight="bold",
+        color="#5b9b5b",
+        transform=ax.transAxes,
+    )
+    ax.text(
+        0.5,
+        0.13,
+        "PROTEIN DATA BANK",
+        ha="center",
+        va="center",
+        fontsize=5.8 * scale,
+        fontweight="bold",
+        color="#202020",
+        transform=ax.transAxes,
+    )
+
+
+def _add_page_header(fig: plt.Figure, *, page_no: int, total: int, title: str, entry: str) -> None:
+    """RCSB-style running header.
+
+    The cover page in wwPDB reports has no running header; page 2 onward does.
+    """
+    if page_no <= 1:
+        return
+
+    ax = fig.add_axes((0.07, 0.952, 0.86, 0.036))
+    ax.set_xlim(0, 1)
+    ax.set_ylim(0, 1)
+    ax.axis("off")
+    ax.text(
+        0.0,
+        0.62,
+        f"Page {page_no}",
+        fontsize=10,
+        ha="left",
+        va="center",
+        color="#111111",
+        transform=ax.transAxes,
+    )
+    ax.text(
+        0.5,
+        0.62,
+        title,
+        fontsize=10,
+        ha="center",
+        va="center",
+        color="#111111",
+        transform=ax.transAxes,
+    )
+    ax.text(
+        1.0,
+        0.62,
+        entry,
+        fontsize=10,
         ha="right",
         va="center",
-        fontsize=8,
-        color="#555",
+        color="#111111",
         transform=ax.transAxes,
     )
+    ax.plot([0.0, 1.0], [0.18, 0.18], color=_HEADER_RULE, linewidth=0.6, transform=ax.transAxes)
+
+
+def _add_page_footer(fig: plt.Figure, *, page_no: int, total: int, last: bool) -> None:
+    """RCSB-style footer: small centered wordmark, no bottom page-number rule."""
+    if page_no <= 1:
+        return
+    _draw_wordmark(fig, x=0.5, y=0.030, w=0.090, h=0.038, scale=0.42)
 
 
 def _draw_info_box(fig: plt.Figure, *, x: float, y: float, w: float, h: float, lines: Sequence[str]) -> None:
+    """Square-corner pink/red cover callout, closer to wwPDB style."""
     ax = fig.add_axes((x, y, w, h))
     ax.set_xlim(0, 1)
     ax.set_ylim(0, 1)
     ax.axis("off")
-    box = FancyBboxPatch(
-        (0.005, 0.05),
-        0.99,
-        0.90,
-        boxstyle="round,pad=0.02,rounding_size=0.02",
-        linewidth=0.6,
-        edgecolor=_INFO_EDGE,
-        facecolor=_INFO_BG,
-        transform=ax.transAxes,
+    ax.add_patch(
+        Rectangle(
+            (0.0, 0.0),
+            1.0,
+            1.0,
+            linewidth=0.8,
+            edgecolor=_INFO_EDGE,
+            facecolor=_INFO_BG,
+            transform=ax.transAxes,
+        )
     )
-    ax.add_patch(box)
-    n = len(lines)
-    if n == 0:
+    if not lines:
         return
+
+    n = len(lines)
     top = 0.83
-    line_h = 0.7 / max(1, n)
+    line_h = 0.68 / max(1, n - 1) if n > 1 else 0.0
     for i, line in enumerate(lines):
         ax.text(
             0.5,
@@ -280,8 +419,8 @@ def _draw_info_box(fig: plt.Figure, *, x: float, y: float, w: float, h: float, l
             line,
             ha="center",
             va="top",
-            fontsize=9.5,
-            color="#1d1d1d",
+            fontsize=10.5,
+            color="#111111",
             transform=ax.transAxes,
         )
 
@@ -307,36 +446,90 @@ def _draw_meta_block(fig: plt.Figure, *, x: float, y: float, w: float, h: float,
         ax.text(val_x, ypos, value, fontsize=10.5, ha="left", va="top", transform=ax.transAxes)
 
 
-def _draw_section_heading(fig: plt.Figure, *, x: float, y: float, w: float, h: float, number: str, title: str) -> None:
+def _draw_section_heading(
+    fig: plt.Figure,
+    *,
+    x: float,
+    y: float,
+    w: float,
+    h: float,
+    number: str,
+    title: str,
+    show_info: bool = False,
+) -> None:
+    """Large numbered section heading with RCSB-like spacing."""
     ax = fig.add_axes((x, y, w, h))
+    ax.set_xlim(0, 1)
+    ax.set_ylim(0, 1)
     ax.axis("off")
+
+    number_text = _truncate(str(number), 8)
+    title_x = 0.060 + max(0, len(number_text) - 2) * 0.010
+
     ax.text(
         0.0,
-        0.4,
-        f"{number}  {title}",
-        fontsize=15,
+        0.50,
+        number_text,
+        fontsize=17,
+        fontweight="bold",
+        ha="left",
+        va="center",
+        color="#101010",
+        transform=ax.transAxes,
+    )
+    ax.text(
+        title_x,
+        0.50,
+        title,
+        fontsize=17,
         fontweight="bold",
+        ha="left",
+        va="center",
         color="#101010",
         transform=ax.transAxes,
     )
 
+    if show_info:
+        # Approximate icon placement immediately after the heading.
+        icon_x = min(x + w - 0.020, x + title_x * w + 0.0120 * len(title) + 0.020)
+        _draw_info_icon(fig, x=icon_x, y=y + h * 0.52, r=0.011)
+
 
 # ---------------------------------------------------------------------------
 # slider primitive
 # ---------------------------------------------------------------------------
 
-_GRADIENT = np.tile(np.linspace(0.02, 0.98, 512), (4, 1))
+# High-resolution gradient; bars are deliberately thin.
+_GRADIENT = np.tile(np.linspace(0.0, 1.0, 1024), (2, 1))
+
+
+# Compact RCSB-like chart layout in figure coordinates.
+# These positions intentionally mimic the page-2 wwPDB chart proportions.
+_RCSB_SLIDER_LAYOUT = {
+    "label_right": 0.235,
+    "bar_x": 0.240,
+    "bar_width": 0.382,
+    "value_x": 0.632,
+    "value_width": 0.120,
+    "bar_height": 0.0105,
+    "row_height": 0.0315,
+}
+
+
+def _clip_pct(pct: float | None) -> float | None:
+    if pct is None or not math.isfinite(pct):
+        return None
+    return max(0.0, min(1.0, pct))
 
 
 def _draw_slider_bar(
     ax,
-    percentile: float | None,
+    percentile: float | None = None,
     *,
-    cmap: str = _SLIDER_CMAP,
-    show_axis: bool = False,
+    cmap=_SLIDER_CMAP,
+    draw_marker: bool = True,
 ) -> None:
-    """RCSB-style horizontal percentile bar with a single black marker."""
-
+    """Thin wwPDB-style red-white-blue percentile bar."""
     ax.imshow(
         _GRADIENT,
         aspect="auto",
@@ -346,117 +539,83 @@ def _draw_slider_bar(
     )
     ax.set_xlim(0.0, 1.0)
     ax.set_ylim(0.0, 1.0)
-    ax.set_yticks([])
-    if show_axis:
-        ax.set_xticks([0.0, 0.25, 0.5, 0.75, 1.0])
-        ax.set_xticklabels(["0", "25", "50", "75", "100"], fontsize=7)
-        ax.tick_params(axis="x", length=2, pad=1, colors="#333333")
-    else:
-        ax.set_xticks([])
-
-    for spine in ax.spines.values():
-        spine.set_visible(True)
-        spine.set_edgecolor("#1a1a1a")
-        spine.set_linewidth(0.6)
+    ax.axis("off")
 
-    if percentile is not None:
+    pct = _clip_pct(percentile)
+    if draw_marker and pct is not None:
         ax.add_patch(
             Rectangle(
-                (max(0.0, min(1.0, percentile)) - 0.005, -0.10),
-                0.010,
-                1.20,
-                color="#0e0e0e",
+                (pct - 0.006, -0.15),
+                0.012,
+                1.30,
+                facecolor="#0b0b0b",
+                edgecolor="#0b0b0b",
+                linewidth=0.4,
                 clip_on=False,
                 zorder=5,
             )
         )
 
 
-_LAYOUT = {
-    "left": 0.085,
-    "label_width": 0.190,
-    "gap_label_slider": 0.012,
-    "slider_width": 0.460,
-    "gap_slider_pct": 0.014,
-    "pct_width": 0.045,
-    "gap_pct_value": 0.010,
-    "value_width": 0.115,
-}
+def _metric_rows_for_slider_panel(
+    row: Mapping[str, Any],
+    *,
+    include_overall: bool,
+) -> list[tuple[str, float | None, float | None, str]]:
+    rows: list[tuple[str, float | None, float | None, str]] = []
+
+    if include_overall:
+        score = _row_meta_score(row)
+        rows.append(("Overall meta score", score, score, ""))
+
+    fv = _feature_view(row)
+    for feat in META_SCORE_FEATURES:
+        raw, pct = fv[feat]
+        rows.append(
+            (
+                _FEATURE_DISPLAY.get(feat, feat),
+                raw,
+                pct,
+                _FEATURE_UNITS.get(feat, ""),
+            )
+        )
+
+    return rows
 
 
-def _draw_slider_row(
+def _draw_percentile_legend(
     fig: plt.Figure,
     *,
-    bottom: float,
-    height: float,
-    label: str,
-    raw: float | None,
-    pct: float | None,
-    units: str = "",
-    show_axis: bool = False,
+    x: float,
+    y: float,
+    w: float,
+    label: str = "Percentile relative to AlphaJudge benchmark",
 ) -> None:
-    L = _LAYOUT
-    x = L["left"]
-    label_ax = fig.add_axes((x, bottom, L["label_width"], height))
-    label_ax.axis("off")
-    label_ax.text(
-        1.0,
-        0.5,
-        label,
-        fontsize=10,
-        ha="right",
-        va="center",
-        transform=label_ax.transAxes,
-    )
-    x += L["label_width"] + L["gap_label_slider"]
-
-    slider_ax = fig.add_axes(
-        (
-            x,
-            bottom + (0.20 if not show_axis else 0.30) * height,
-            L["slider_width"],
-            (0.55 if not show_axis else 0.42) * height,
+    ax = fig.add_axes((x, y, w, 0.032))
+    ax.set_xlim(0, 1)
+    ax.set_ylim(0, 1)
+    ax.axis("off")
+
+    ax.add_patch(
+        Rectangle(
+            (0.000, 0.55),
+            0.010,
+            0.30,
+            facecolor="#0b0b0b",
+            edgecolor="#0b0b0b",
+            linewidth=0.4,
+            transform=ax.transAxes,
         )
     )
-    _draw_slider_bar(slider_ax, pct, show_axis=show_axis)
-    x += L["slider_width"] + L["gap_slider_pct"]
-
-    pct_ax = fig.add_axes((x, bottom + 0.18 * height, L["pct_width"], 0.64 * height))
-    pct_ax.set_xlim(0, 1)
-    pct_ax.set_ylim(0, 1)
-    pct_ax.axis("off")
-    pct_text = "n/a" if pct is None else f"{pct * 100:0.0f}%"
-    pct_ax.text(
-        0.5,
-        0.5,
-        pct_text,
-        ha="center",
-        va="center",
-        fontsize=9,
-        color="#222222",
-        transform=pct_ax.transAxes,
-    )
-    x += L["pct_width"] + L["gap_pct_value"]
-
-    value_ax = fig.add_axes((x, bottom + 0.18 * height, L["value_width"], 0.64 * height))
-    value_ax.set_xlim(0, 1)
-    value_ax.set_ylim(0, 1)
-    value_ax.set_xticks([])
-    value_ax.set_yticks([])
-    for spine in value_ax.spines.values():
-        spine.set_edgecolor("#5a5a5a")
-        spine.set_linewidth(0.6)
-    raw_text = _format_raw(raw)
-    if units:
-        raw_text = f"{raw_text} {units}"
-    value_ax.text(
-        0.5,
-        0.5,
-        raw_text,
-        ha="center",
+    ax.text(
+        0.018,
+        0.70,
+        label,
+        ha="left",
         va="center",
-        fontsize=9,
-        transform=value_ax.transAxes,
+        fontsize=7.2,
+        color="#111111",
+        transform=ax.transAxes,
     )
 
 
@@ -467,135 +626,176 @@ def _draw_slider_panel(
     height: float,
     row: Mapping[str, Any],
     include_overall: bool = True,
-) -> None:
-    """RCSB-style 'Metric | Percentile rank | %ile | Value' table."""
-
-    rows: list[tuple[str, float | None, float | None, str]] = []
-    if include_overall:
-        score = _row_meta_score(row)
-        rows.append(("Overall meta score", score, score, ""))
-    fv = _feature_view(row)
-    for feat in META_SCORE_FEATURES:
-        raw, pct = fv[feat]
-        rows.append((_FEATURE_DISPLAY.get(feat, feat), raw, pct, _FEATURE_UNITS.get(feat, "")))
+) -> float:
+    """Draw a compact wwPDB-style percentile graphic.
 
-    L = _LAYOUT
-    header_y = top
-    body_top = top - 0.024
+    Returns the bottom y coordinate of the graphic, useful if a table should be
+    placed below it.
+    """
+    rows = _metric_rows_for_slider_panel(row, include_overall=include_overall)
     n_rows = len(rows)
-    body_height = height - 0.024
-    row_h = body_height / n_rows
-
-    # Header band
-    band = fig.add_axes(
-        (
-            L["left"],
-            header_y - 0.022,
-            L["label_width"] + L["gap_label_slider"] + L["slider_width"] + L["gap_slider_pct"]
-            + L["pct_width"] + L["gap_pct_value"] + L["value_width"],
-            0.022,
-        )
-    )
-    band.set_xlim(0, 1)
-    band.set_ylim(0, 1)
-    band.axis("off")
-    band.add_patch(Rectangle((0.0, 0.0), 1.0, 1.0, color="#efe9d8", transform=band.transAxes))
-
-    band_w = (
-        L["label_width"] + L["gap_label_slider"] + L["slider_width"]
-        + L["gap_slider_pct"] + L["pct_width"] + L["gap_pct_value"] + L["value_width"]
-    )
-
-    def _hx(col_start: float, col_w: float) -> float:
-        return (col_start - L["left"] + col_w / 2) / band_w
-
-    # Place header labels at column centers
-    band.text(
-        _hx(L["left"], L["label_width"]),
-        0.5,
+    if n_rows == 0:
+        return top
+
+    L = _RCSB_SLIDER_LAYOUT
+    label_right = L["label_right"]
+    bar_x = L["bar_x"]
+    bar_w = L["bar_width"]
+    value_x = L["value_x"]
+    bar_h = L["bar_height"]
+
+    # Keep the RCSB compact feel even when many AlphaJudge metrics are shown.
+    row_h = min(L["row_height"], max(0.026, (height - 0.075) / max(1, n_rows)))
+    header_y = top - 0.012
+    first_center = top - 0.048
+
+    # Column headers - no beige band, no boxed cells.
+    fig.text(
+        label_right - 0.020,
+        header_y,
         "Metric",
-        fontsize=10,
-        fontweight="bold",
         ha="center",
         va="center",
-        transform=band.transAxes,
-    )
-    slider_start = L["left"] + L["label_width"] + L["gap_label_slider"]
-    band.text(
-        _hx(slider_start, L["slider_width"]),
-        0.5,
-        "Percentile rank",
         fontsize=10,
-        fontweight="bold",
-        ha="center",
-        va="center",
-        transform=band.transAxes,
+        color="#111111",
     )
-    pct_start = slider_start + L["slider_width"] + L["gap_slider_pct"]
-    band.text(
-        _hx(pct_start, L["pct_width"]),
-        0.5,
-        "%",
-        fontsize=10,
-        fontweight="bold",
+    fig.text(
+        bar_x + bar_w / 2,
+        header_y,
+        "Percentile Ranks",
         ha="center",
         va="center",
-        transform=band.transAxes,
+        fontsize=10,
+        color="#111111",
     )
-    value_start = pct_start + L["pct_width"] + L["gap_pct_value"]
-    band.text(
-        _hx(value_start, L["value_width"]),
-        0.5,
+    fig.text(
+        value_x + 0.035,
+        header_y,
         "Value",
-        fontsize=10,
-        fontweight="bold",
         ha="center",
         va="center",
-        transform=band.transAxes,
+        fontsize=10,
+        color="#111111",
     )
 
+    # Rows: label, thin gradient bar, raw value.
+    pct_positions: list[tuple[int, float]] = []
     for i, (label, raw, pct, units) in enumerate(rows):
-        row_bottom = body_top - (i + 1) * row_h
-        show_axis = i == n_rows - 1
-        _draw_slider_row(
-            fig,
-            bottom=row_bottom,
-            height=row_h * 0.92,
-            label=label,
-            raw=raw,
-            pct=pct,
-            units=units,
-            show_axis=show_axis,
+        center_y = first_center - i * row_h
+        pct_clipped = _clip_pct(pct)
+
+        fig.text(
+            label_right,
+            center_y,
+            label,
+            ha="right",
+            va="center",
+            fontsize=9.2,
+            color="#111111",
+        )
+
+        bar_ax = fig.add_axes((bar_x, center_y - bar_h / 2, bar_w, bar_h), zorder=2)
+        _draw_slider_bar(bar_ax, None, draw_marker=False)
+
+        raw_text = _format_raw(raw)
+        if units and raw_text != "—":
+            raw_text = f"{raw_text} {units}"
+
+        fig.text(
+            value_x,
+            center_y,
+            raw_text,
+            ha="left",
+            va="center",
+            fontsize=9.2,
+            color="#111111",
+        )
+
+        if pct_clipped is not None:
+            pct_positions.append((i, pct_clipped))
+
+    # Overlay a transparent axis over all bars so the RCSB-style black marker
+    # polyline connects the per-metric percentiles.
+    chart_top = first_center + row_h * 0.50
+    chart_bottom = first_center - (n_rows - 1) * row_h - row_h * 0.50
+
+    line_ax = fig.add_axes((bar_x, chart_bottom, bar_w, chart_top - chart_bottom), zorder=20)
+    line_ax.set_xlim(0.0, 1.0)
+    line_ax.set_ylim(0.0, float(n_rows))
+    line_ax.axis("off")
+    line_ax.patch.set_alpha(0.0)
+
+    def _row_y(idx: int) -> float:
+        return n_rows - idx - 0.5
+
+    # Draw contiguous polyline segments only across valid percentile rows.
+    current_segment: list[tuple[float, float]] = []
+    segments: list[list[tuple[float, float]]] = []
+    valid_by_idx = {idx: pct for idx, pct in pct_positions}
+
+    for idx in range(n_rows):
+        pct = valid_by_idx.get(idx)
+        if pct is None:
+            if current_segment:
+                segments.append(current_segment)
+                current_segment = []
+            continue
+        current_segment.append((pct, _row_y(idx)))
+
+    if current_segment:
+        segments.append(current_segment)
+
+    for seg in segments:
+        if len(seg) >= 2:
+            xs = [p for p, _y in seg]
+            ys = [_y for _p, _y in seg]
+            line_ax.plot(xs, ys, color="#0b0b0b", linewidth=0.75, zorder=4)
+
+    marker_w = 0.012
+    marker_h = max(0.42, min(0.56, (bar_h / row_h) * 1.35))
+    for idx, pct in pct_positions:
+        y = _row_y(idx)
+        line_ax.add_patch(
+            Rectangle(
+                (pct - marker_w / 2, y - marker_h / 2),
+                marker_w,
+                marker_h,
+                facecolor="#0b0b0b",
+                edgecolor="#0b0b0b",
+                linewidth=0.45,
+                zorder=6,
+                clip_on=False,
+            )
         )
 
-    bottom_y = body_top - n_rows * row_h
-    legend_ax = fig.add_axes((slider_start, bottom_y - 0.022, L["slider_width"], 0.018))
-    legend_ax.axis("off")
-    legend_ax.annotate(
+    # Worse / Better labels directly beneath the bars, as in wwPDB reports.
+    wb_y = chart_bottom - 0.011
+    fig.text(
+        bar_x,
+        wb_y,
         "Worse",
-        xy=(0.0, 0.5),
-        xytext=(0.08, 0.5),
-        xycoords="axes fraction",
-        textcoords="axes fraction",
-        fontsize=8.5,
-        color="#7a1d1d",
-        va="center",
         ha="left",
-        arrowprops=dict(arrowstyle="<-", color="#7a1d1d", lw=0.7),
+        va="center",
+        fontsize=6.8,
+        fontstyle="italic",
+        color="#111111",
     )
-    legend_ax.annotate(
+    fig.text(
+        bar_x + bar_w,
+        wb_y,
         "Better",
-        xy=(1.0, 0.5),
-        xytext=(0.92, 0.5),
-        xycoords="axes fraction",
-        textcoords="axes fraction",
-        fontsize=8.5,
-        color="#1d5d1d",
-        va="center",
         ha="right",
-        arrowprops=dict(arrowstyle="->", color="#1d5d1d", lw=0.7),
+        va="center",
+        fontsize=6.8,
+        fontstyle="italic",
+        color="#111111",
     )
 
+    legend_y = chart_bottom - 0.045
+    _draw_percentile_legend(fig, x=bar_x - 0.002, y=legend_y, w=0.55)
+
+    return legend_y
+
 
 # ---------------------------------------------------------------------------
 # compact, fixed-width tables (no matplotlib.table -- it truncates labels)
@@ -716,9 +916,11 @@ def _cover_page(
     total: int,
 ) -> None:
     fig = _new_figure()
-    _add_page_header(fig, page_no=page_no, total=total, title=title, entry=entry_id)
 
-    title_ax = fig.add_axes((0.07, 0.85, 0.86, 0.06))
+    # RCSB cover has no running header; it starts with the wordmark.
+    _draw_wordmark(fig, x=0.50, y=0.865, w=0.24, h=0.075, scale=1.15)
+
+    title_ax = fig.add_axes((0.07, 0.785, 0.86, 0.060))
     title_ax.axis("off")
     title_ax.text(
         0.5,
@@ -727,51 +929,57 @@ def _cover_page(
         ha="center",
         va="center",
         fontsize=22,
-        fontweight="bold",
+        fontweight="normal",
         color="#101010",
         transform=title_ax.transAxes,
     )
+    _draw_info_icon(fig, x=0.865, y=0.815, r=0.013)
 
-    sub_ax = fig.add_axes((0.07, 0.815, 0.86, 0.025))
+    sub_ax = fig.add_axes((0.07, 0.690, 0.86, 0.040))
     sub_ax.axis("off")
     sub_ax.text(
         0.5,
         0.5,
-        " – ".join(subtitle_lines),
+        " - ".join(subtitle_lines),
         ha="center",
         va="center",
-        fontsize=11,
+        fontsize=13,
         color="#1f1f1f",
         transform=sub_ax.transAxes,
     )
 
-    _draw_meta_block(fig, x=0.10, y=0.62, w=0.80, h=0.18, pairs=meta_pairs)
-    _draw_info_box(fig, x=0.13, y=0.43, w=0.74, h=0.16, lines=info_lines)
+    _draw_meta_block(fig, x=0.10, y=0.535, w=0.80, h=0.135, pairs=meta_pairs)
+
+    _draw_info_box(fig, x=0.09, y=0.350, w=0.82, h=0.135, lines=info_lines)
 
-    sw_ax = fig.add_axes((0.10, 0.20, 0.80, 0.18))
+    sw_ax = fig.add_axes((0.10, 0.090, 0.80, 0.210))
     sw_ax.set_xlim(0, 1)
     sw_ax.set_ylim(0, 1)
     sw_ax.axis("off")
+
+    # Short horizontal rule above the software block, as on the wwPDB cover.
+    sw_ax.plot([0.0, 0.42], [0.98, 0.98], color=_HEADER_RULE, linewidth=0.6, transform=sw_ax.transAxes)
+
     sw_ax.text(
         0.0,
-        0.95,
+        0.84,
         "The following software and reference data were used in this report:",
         fontsize=10,
         ha="left",
         va="top",
         transform=sw_ax.transAxes,
     )
+
     n = len(software_lines)
     if n:
-        top = 0.80
-        line_h = 0.68 / max(1, n)
+        top = 0.66
+        line_h = 0.56 / max(1, n - 1) if n > 1 else 0.0
         for i, (k, v) in enumerate(software_lines):
             ypos = top - i * line_h
-            sw_ax.text(0.40, ypos, k, fontsize=10, ha="right", va="top", transform=sw_ax.transAxes)
-            sw_ax.text(0.42, ypos, ":", fontsize=10, ha="center", va="top", transform=sw_ax.transAxes)
-            sw_ax.text(0.44, ypos, v, fontsize=10, ha="left", va="top", transform=sw_ax.transAxes)
+            sw_ax.text(0.39, ypos, k, fontsize=10, ha="right", va="top", transform=sw_ax.transAxes)
+            sw_ax.text(0.415, ypos, ":", fontsize=10, ha="center", va="top", transform=sw_ax.transAxes)
+            sw_ax.text(0.445, ypos, v, fontsize=10, ha="left", va="top", transform=sw_ax.transAxes)
 
-    _add_page_footer(fig, page_no=page_no, total=total, last=False)
     pdf.savefig(fig)
     plt.close(fig)
 
@@ -791,13 +999,23 @@ def _quality_page(
 ) -> None:
     fig = _new_figure()
     _add_page_header(fig, page_no=page_no, total=total, title=title, entry=entry_id)
-    _draw_section_heading(fig, x=0.07, y=0.91, w=0.86, h=0.03, number=section_no, title=section_title)
-    intro_ax = fig.add_axes((0.10, 0.79, 0.80, 0.11))
+
+    _draw_section_heading(
+        fig,
+        x=0.07,
+        y=0.895,
+        w=0.86,
+        h=0.045,
+        number=section_no,
+        title=section_title,
+    )
+
+    intro_ax = fig.add_axes((0.10, 0.810, 0.80, 0.070))
     intro_ax.axis("off")
     for i, line in enumerate(pre_lines):
         intro_ax.text(
             0.0,
-            0.95 - i * 0.18,
+            0.95 - i * 0.32,
             line,
             fontsize=10,
             ha="left",
@@ -805,7 +1023,18 @@ def _quality_page(
             transform=intro_ax.transAxes,
         )
 
-    _draw_slider_panel(fig, top=0.76, height=0.60, row=row, include_overall=True)
+    intro_ax.text(
+        0.0,
+        0.05,
+        "Percentile scores ranging between 0-100 for AlphaJudge interface metrics are shown in "
+        "the following graphic.",
+        fontsize=10,
+        ha="left",
+        va="bottom",
+        transform=intro_ax.transAxes,
+    )
+
+    _draw_slider_panel(fig, top=0.775, height=0.56, row=row, include_overall=True)
 
     _add_page_footer(fig, page_no=page_no, total=total, last=last)
     pdf.savefig(fig)

From 5f743c41fabf7593ccfb33beb04f8bb742b87e30 Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Thu, 28 May 2026 10:39:38 +0200
Subject: [PATCH 13/15] AlphaJudge-only branding, AFDB-style PAE PNG, grouped
 slider polylines
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Branding (no external logos):
  - Remove the generated PDB-style wordmark and the vector chain-pair
    logo. The cover page no longer carries any third-party mark; only
    the report title remains. The footer carries a plain "AlphaJudge
    report" text mark.
  - Title is now "AlphaJudge Interface validation Report".

PAE page + standalone PAE PNG (shared rendering):
  - report.py exposes render_pae_png(out_path, pae, ...) which produces
    an AlphaFold-DB-like standalone PNG: green square heatmap, horizontal
    "Expected position error (Ångströms)" colour bar, Scored / Aligned
    residue axes, black inter-chain separator lines.
  - runner._save_pae_heatmap now delegates to render_pae_png so the
    pae_<model>.png files written during scoring match the in-report
    PAE page exactly. No if/else fallback path: the report just embeds
    the standalone PNG.

Slider panel:
  - Show the overall meta score as a separate "Meta score" row at the
    top, visually offset from the per-feature rows by an inter-group
    gap, in the same typography as the other rows (PDB-validation-style
    uniform treatment). The marker polyline never crosses Meta score.
  - Split the polyline into two groups that connect related metrics:
    the AlphaFold-derived confidence features (LIS, ipSAE, pDockQ2,
    ipTM, confidence, avg interface PAE, pDockQ/mpDockQ) and the
    biophysical features (shape complementarity, interface area,
    solvation energy). Each group has its own connecting line.

The cover page also drops the older "Overall meta score" label and
restores the canonical "AlphaJudge Interface validation Report" title.
---
 src/alphajudge/report.py | 436 ++++++++++++++++++++++++++++-----------
 src/alphajudge/runner.py |  47 ++---
 2 files changed, 336 insertions(+), 147 deletions(-)

diff --git a/src/alphajudge/report.py b/src/alphajudge/report.py
index a2cf12fa..892bb2e7 100644
--- a/src/alphajudge/report.py
+++ b/src/alphajudge/report.py
@@ -1,19 +1,14 @@
-"""RCSB-style validation reports for AlphaJudge interface scores.
+"""AlphaJudge validation reports for AlphaJudge interface scores.
 
-The visual layout mirrors the wwPDB / RCSB "Full Validation Report" PDF
-(see e.g. ``https://files.rcsb.org/validation/view/<id>_full_validation.pdf``):
+The layout uses a compact scientific validation-report format with only
+AlphaJudge branding. No external organisation logo, PDB/wwPDB wordmark,
+AlphaFold logo, or EMBL-EBI logo is embedded.
 
-* serif typography (DejaVu Serif, the available Computer-Modern lookalike);
-* a smooth red -> yellow -> green percentile slider with a single black
-  marker for the entry's archive percentile;
-* a numbered "Overall quality at a glance" page with a metric/value table;
-* a page header rule with title + entry id, and a thin bottom rule
-  with the page number.
-
-Two entry points:
-
-* :func:`generate_per_run_report` -- one ``report.pdf`` per run directory.
-* :func:`generate_aggregate_report` -- a multi-page PDF over a merged CSV.
+The percentile pages use a compact red -> white -> blue percentile graphic.
+The PAE page is rendered, when raw PAE values are available, in the visual
+style of the AlphaFold Database PAE panel: a green square heatmap with
+Scored residue / Aligned residue axes and a horizontal expected-position-error
+colour bar.
 """
 
 from __future__ import annotations
@@ -35,7 +30,8 @@
 import numpy as np
 from matplotlib.backends.backend_pdf import PdfPages
 from matplotlib.colors import LinearSegmentedColormap
-from matplotlib.patches import Circle, FancyBboxPatch, Rectangle
+from matplotlib.patches import Circle, Rectangle
+from matplotlib.ticker import FuncFormatter, MaxNLocator
 
 from .meta_score import (
     BENCHMARK_QUANTILES,
@@ -50,10 +46,9 @@
 
 _A4 = (8.27, 11.69)
 
-# RCSB/wwPDB percentile graphic: red -> pale center -> blue.
-# Do not use RdYlGn here; the wwPDB report uses a red/blue percentile bar.
+# Percentile graphic: red -> pale centre -> blue.
 _SLIDER_CMAP = LinearSegmentedColormap.from_list(
-    "wwpdb_percentile",
+    "alphajudge_percentile",
     [
         (0.00, "#ff1a1a"),
         (0.35, "#ffd1d1"),
@@ -63,15 +58,33 @@
     ],
 )
 
+# AlphaFold-DB-like PAE palette: low error = dark green, high error = pale.
+_PAE_CMAP = LinearSegmentedColormap.from_list(
+    "alphafold_db_like_pae",
+    [
+        (0.00, "#005f2f"),
+        (0.20, "#16813e"),
+        (0.45, "#56ad55"),
+        (0.72, "#cdebc5"),
+        (1.00, "#f7fbf1"),
+    ],
+)
+
 _INFO_BG = "#ffb3b3"
 _INFO_EDGE = "#ff0000"
 _HEADER_RULE = "#303030"
 _TABLE_RULE = "#202020"
-_RCSB_BLUE = "#0000ff"
 
-_REPORT_TITLE = "AlphaJudge Interface Validation Report"
+_AJ_BLUE = "#1f4e79"
+_AJ_GREEN = "#2e8b57"
+_AJ_GOLD = "#d08c00"
+_AJ_DARK = "#111111"
+
+_REPORT_TITLE = "AlphaJudge Interface validation Report"
 _BENCHMARK_TAG = "benchmark_26 (final_sync_20260523, n=7,756 AF2/AF3 rows)"
 
+_GRADIENT = np.tile(np.linspace(0.0, 1.0, 1024), (2, 1))
+
 _FEATURE_DISPLAY = {
     "interface_LIS": "Interface LIS",
     "interface_ipSAE": "Interface ipSAE",
@@ -91,6 +104,24 @@
     "interface_solv_en": "kcal/mol",
 }
 
+# Metric grouping for the slider panel. Lines are drawn only WITHIN each group
+# (AF-derived vs. biophysical); the Q-score is kept separate and never joined
+# to a polyline.
+_AF_DERIVED_FEATURES = (
+    "interface_LIS",
+    "interface_ipSAE",
+    "interface_pDockQ2",
+    "iptm",
+    "confidence_score",
+    "average_interface_pae",
+    "pDockQ/mpDockQ",
+)
+_BIOPHYSICAL_FEATURES = (
+    "interface_sc",
+    "interface_area",
+    "interface_solv_en",
+)
+
 
 # ---------------------------------------------------------------------------
 # style + utility helpers
@@ -255,7 +286,7 @@ def _new_figure() -> plt.Figure:
 
 
 def _draw_info_icon(fig: plt.Figure, *, x: float, y: float, r: float = 0.010) -> None:
-    """Small blue circled 'i' like the wwPDB validation report."""
+    """Small circled 'i' marker using AlphaJudge brand colour."""
     ax = fig.add_axes((x - r, y - r, 2 * r, 2 * r))
     ax.set_xlim(0, 1)
     ax.set_ylim(0, 1)
@@ -266,7 +297,7 @@ def _draw_info_icon(fig: plt.Figure, *, x: float, y: float, r: float = 0.010) ->
             (0.5, 0.5),
             0.47,
             facecolor="white",
-            edgecolor=_RCSB_BLUE,
+            edgecolor=_AJ_BLUE,
             linewidth=1.0,
             transform=ax.transAxes,
         )
@@ -278,61 +309,65 @@ def _draw_info_icon(fig: plt.Figure, *, x: float, y: float, r: float = 0.010) ->
         ha="center",
         va="center",
         fontsize=8,
-        color=_RCSB_BLUE,
+        color=_AJ_BLUE,
         fontweight="bold",
         transform=ax.transAxes,
     )
 
 
-def _draw_wordmark(
+def _draw_alphajudge_logo(
     fig: plt.Figure,
     *,
     x: float = 0.5,
     y: float = 0.93,
-    w: float = 0.20,
-    h: float = 0.060,
-    scale: float = 1.0,
+    w: float = 0.30,
+    h: float = 0.080,
+    compact: bool = False,
 ) -> None:
-    """A lightweight text stand-in for the small wwPDB/PDB wordmark.
+    """Plain-text AlphaJudge mark.
 
-    Use an approved logo image here if you have one; this avoids bundling any
-    external logo asset while still matching the spatial rhythm of the report.
+    Renders just "AlphaJudge report" (and a small "interface validation"
+    sub-line in the non-compact form). Intentionally text-only to avoid
+    any resemblance to third-party logos.
     """
     ax = fig.add_axes((x - w / 2, y - h / 2, w, h))
     ax.set_xlim(0, 1)
     ax.set_ylim(0, 1)
     ax.axis("off")
+
+    if compact:
+        ax.text(
+            0.5,
+            0.5,
+            "AlphaJudge report",
+            ha="center",
+            va="center",
+            fontsize=9,
+            fontweight="bold",
+            color=_AJ_DARK,
+            transform=ax.transAxes,
+        )
+        return
+
     ax.text(
         0.5,
-        0.88,
-        "W O R L D W I D E",
-        ha="center",
-        va="center",
-        fontsize=6.5 * scale,
-        fontweight="bold",
-        color="#202020",
-        transform=ax.transAxes,
-    )
-    ax.text(
-        0.5,
-        0.50,
-        "PDB",
+        0.62,
+        "AlphaJudge report",
         ha="center",
         va="center",
-        fontsize=24 * scale,
+        fontsize=22,
         fontweight="bold",
-        color="#5b9b5b",
+        color=_AJ_DARK,
         transform=ax.transAxes,
     )
     ax.text(
         0.5,
-        0.13,
-        "PROTEIN DATA BANK",
+        0.28,
+        "interface validation",
         ha="center",
         va="center",
-        fontsize=5.8 * scale,
-        fontweight="bold",
-        color="#202020",
+        fontsize=9,
+        color="#444444",
         transform=ax.transAxes,
     )
 
@@ -383,10 +418,17 @@ def _add_page_header(fig: plt.Figure, *, page_no: int, total: int, title: str, e
 
 
 def _add_page_footer(fig: plt.Figure, *, page_no: int, total: int, last: bool) -> None:
-    """RCSB-style footer: small centered wordmark, no bottom page-number rule."""
+    """Small centered AlphaJudge mark; no third-party wordmark."""
     if page_no <= 1:
         return
-    _draw_wordmark(fig, x=0.5, y=0.030, w=0.090, h=0.038, scale=0.42)
+    _draw_alphajudge_logo(
+        fig,
+        x=0.5,
+        y=0.028,
+        w=0.170,
+        h=0.034,
+        compact=True,
+    )
 
 
 def _draw_info_box(fig: plt.Figure, *, x: float, y: float, w: float, h: float, lines: Sequence[str]) -> None:
@@ -499,12 +541,7 @@ def _draw_section_heading(
 # slider primitive
 # ---------------------------------------------------------------------------
 
-# High-resolution gradient; bars are deliberately thin.
-_GRADIENT = np.tile(np.linspace(0.0, 1.0, 1024), (2, 1))
-
-
-# Compact RCSB-like chart layout in figure coordinates.
-# These positions intentionally mimic the page-2 wwPDB chart proportions.
+# Compact chart layout in figure coordinates.
 _RCSB_SLIDER_LAYOUT = {
     "label_right": 0.235,
     "bar_x": 0.240,
@@ -561,15 +598,22 @@ def _metric_rows_for_slider_panel(
     row: Mapping[str, Any],
     *,
     include_overall: bool,
-) -> list[tuple[str, float | None, float | None, str]]:
-    rows: list[tuple[str, float | None, float | None, str]] = []
+) -> list[tuple[str, float | None, float | None, str, str]]:
+    """Return (label, raw, percentile, units, group) per slider row.
+
+    Group is one of "overall" (the Q-score header row), "af" (AlphaFold-
+    derived confidence features) or "biophys" (biophysical features). The
+    grouping is used by ``_draw_slider_panel`` to add vertical spacing
+    between groups and to draw polylines only within a group.
+    """
+    rows: list[tuple[str, float | None, float | None, str, str]] = []
 
     if include_overall:
         score = _row_meta_score(row)
-        rows.append(("Overall meta score", score, score, ""))
+        rows.append(("Meta score", score, score, "", "overall"))
 
     fv = _feature_view(row)
-    for feat in META_SCORE_FEATURES:
+    for feat in _AF_DERIVED_FEATURES:
         raw, pct = fv[feat]
         rows.append(
             (
@@ -577,6 +621,18 @@ def _metric_rows_for_slider_panel(
                 raw,
                 pct,
                 _FEATURE_UNITS.get(feat, ""),
+                "af",
+            )
+        )
+    for feat in _BIOPHYSICAL_FEATURES:
+        raw, pct = fv[feat]
+        rows.append(
+            (
+                _FEATURE_DISPLAY.get(feat, feat),
+                raw,
+                pct,
+                _FEATURE_UNITS.get(feat, ""),
+                "biophys",
             )
         )
 
@@ -629,8 +685,12 @@ def _draw_slider_panel(
 ) -> float:
     """Draw a compact wwPDB-style percentile graphic.
 
-    Returns the bottom y coordinate of the graphic, useful if a table should be
-    placed below it.
+    The Q-score row (if included) is rendered first and visually offset
+    from the rest. AlphaFold-derived confidence features and biophysical
+    features are drawn as two separate groups, each connected by its own
+    polyline; lines never cross the Q-score or the group boundary.
+
+    Returns the bottom y coordinate of the graphic.
     """
     rows = _metric_rows_for_slider_panel(row, include_overall=include_overall)
     n_rows = len(rows)
@@ -644,10 +704,15 @@ def _draw_slider_panel(
     value_x = L["value_x"]
     bar_h = L["bar_height"]
 
-    # Keep the RCSB compact feel even when many AlphaJudge metrics are shown.
-    row_h = min(L["row_height"], max(0.026, (height - 0.075) / max(1, n_rows)))
+    # Vertical layout: row height shrinks if the panel has to fit many rows.
+    # Inter-group gap pushes Q-score / AF / biophys apart.
+    group_gap = 0.012
+    n_group_changes = sum(
+        1 for i in range(1, n_rows) if rows[i][4] != rows[i - 1][4]
+    )
+    available = height - 0.075 - n_group_changes * group_gap
+    row_h = min(L["row_height"], max(0.026, available / max(1, n_rows)))
     header_y = top - 0.012
-    first_center = top - 0.048
 
     # Column headers - no beige band, no boxed cells.
     fig.text(
@@ -678,10 +743,23 @@ def _draw_slider_panel(
         color="#111111",
     )
 
-    # Rows: label, thin gradient bar, raw value.
-    pct_positions: list[tuple[int, float]] = []
-    for i, (label, raw, pct, units) in enumerate(rows):
-        center_y = first_center - i * row_h
+    # Compute per-row centres with extra spacing at group transitions.
+    first_center = top - 0.048
+    centers: list[float] = []
+    cur_y = first_center
+    prev_group: str | None = None
+    for _label, _raw, _pct, _units, group in rows:
+        if prev_group is not None and group != prev_group:
+            cur_y -= group_gap
+        centers.append(cur_y)
+        cur_y -= row_h
+        prev_group = group
+
+    # Rows: label, thin gradient bar, raw value. All rows share the same
+    # typography (PDB-validation-style uniform treatment); the inter-group
+    # gap is what separates the overall metascore from the feature rows.
+    pct_positions: list[tuple[int, float, str]] = []
+    for i, ((label, raw, pct, units, group), center_y) in enumerate(zip(rows, centers)):
         pct_clipped = _clip_pct(pct)
 
         fig.text(
@@ -712,48 +790,35 @@ def _draw_slider_panel(
         )
 
         if pct_clipped is not None:
-            pct_positions.append((i, pct_clipped))
+            pct_positions.append((i, pct_clipped, group))
 
-    # Overlay a transparent axis over all bars so the RCSB-style black marker
-    # polyline connects the per-metric percentiles.
-    chart_top = first_center + row_h * 0.50
-    chart_bottom = first_center - (n_rows - 1) * row_h - row_h * 0.50
+    chart_top = centers[0] + row_h * 0.50
+    chart_bottom = centers[-1] - row_h * 0.50
 
     line_ax = fig.add_axes((bar_x, chart_bottom, bar_w, chart_top - chart_bottom), zorder=20)
     line_ax.set_xlim(0.0, 1.0)
-    line_ax.set_ylim(0.0, float(n_rows))
+    line_ax.set_ylim(chart_bottom, chart_top)
     line_ax.axis("off")
     line_ax.patch.set_alpha(0.0)
 
     def _row_y(idx: int) -> float:
-        return n_rows - idx - 0.5
-
-    # Draw contiguous polyline segments only across valid percentile rows.
-    current_segment: list[tuple[float, float]] = []
-    segments: list[list[tuple[float, float]]] = []
-    valid_by_idx = {idx: pct for idx, pct in pct_positions}
-
-    for idx in range(n_rows):
-        pct = valid_by_idx.get(idx)
-        if pct is None:
-            if current_segment:
-                segments.append(current_segment)
-                current_segment = []
-            continue
-        current_segment.append((pct, _row_y(idx)))
-
-    if current_segment:
-        segments.append(current_segment)
-
-    for seg in segments:
-        if len(seg) >= 2:
-            xs = [p for p, _y in seg]
-            ys = [_y for _p, _y in seg]
+        return centers[idx]
+
+    # Polyline segments per metric group (skip "overall" - no line through Q-score).
+    by_group: dict[str, list[tuple[float, float]]] = {"af": [], "biophys": []}
+    for idx, pct, group in pct_positions:
+        if group in by_group:
+            by_group[group].append((pct, _row_y(idx)))
+
+    for points in by_group.values():
+        if len(points) >= 2:
+            xs = [p for p, _y in points]
+            ys = [y for _p, y in points]
             line_ax.plot(xs, ys, color="#0b0b0b", linewidth=0.75, zorder=4)
 
     marker_w = 0.012
-    marker_h = max(0.42, min(0.56, (bar_h / row_h) * 1.35))
-    for idx, pct in pct_positions:
+    marker_h = max(0.0042, min(0.0070, bar_h * 1.35))
+    for idx, pct, group in pct_positions:
         y = _row_y(idx)
         line_ax.add_patch(
             Rectangle(
@@ -768,7 +833,7 @@ def _row_y(idx: int) -> float:
             )
         )
 
-    # Worse / Better labels directly beneath the bars, as in wwPDB reports.
+    # Worse / Better labels directly beneath the bars.
     wb_y = chart_bottom - 0.011
     fig.text(
         bar_x,
@@ -917,10 +982,8 @@ def _cover_page(
 ) -> None:
     fig = _new_figure()
 
-    # RCSB cover has no running header; it starts with the wordmark.
-    _draw_wordmark(fig, x=0.50, y=0.865, w=0.24, h=0.075, scale=1.15)
-
-    title_ax = fig.add_axes((0.07, 0.785, 0.86, 0.060))
+    # Cover: no running header. Just the report title (no separate logo/wordmark).
+    title_ax = fig.add_axes((0.07, 0.830, 0.86, 0.060))
     title_ax.axis("off")
     title_ax.text(
         0.5,
@@ -929,11 +992,10 @@ def _cover_page(
         ha="center",
         va="center",
         fontsize=22,
-        fontweight="normal",
+        fontweight="bold",
         color="#101010",
         transform=title_ax.transAxes,
     )
-    _draw_info_icon(fig, x=0.865, y=0.815, r=0.013)
 
     sub_ax = fig.add_axes((0.07, 0.690, 0.86, 0.040))
     sub_ax.axis("off")
@@ -1121,13 +1183,128 @@ def _per_interface_page(
     plt.close(fig)
 
 
+def _format_residue_tick(value: float, _pos: int | None = None) -> str:
+    if not math.isfinite(value):
+        return ""
+    v = int(round(value))
+    if v >= 1000:
+        text = f"{v / 1000:g}k"
+        return text.replace(".0k", "k")
+    return str(v)
+
+
+def _pae_vmax(matrix: np.ndarray, max_error: float | None) -> float:
+    if max_error is not None and math.isfinite(max_error) and max_error > 0:
+        # AlphaFold DB commonly displays a 0-30 Å scale for static examples.
+        if 28.0 <= max_error <= 32.5:
+            return 30.0
+        return float(math.ceil(max_error / 5.0) * 5.0)
+
+    finite = matrix[np.isfinite(matrix)]
+    if finite.size == 0:
+        return 30.0
+
+    observed = float(np.nanmax(finite))
+    if observed <= 32.5:
+        return 30.0
+    return float(math.ceil(observed / 5.0) * 5.0)
+
+
+def render_pae_png(
+    out_path: str | Path,
+    pae_matrix: Any,
+    *,
+    max_error: float | None = None,
+    model_label: str | None = None,
+    chain_boundaries: Sequence[float] | None = None,
+    figsize: tuple[float, float] = (8.0, 8.6),
+    dpi: int = 200,
+) -> Path | None:
+    """Write a standalone AFDB-style PAE heatmap PNG.
+
+    Used both by the scoring runner (so per-model ``pae_<model>.png`` files
+    look like the in-report graphic) and indirectly by reports that embed
+    the resulting PNG.
+    """
+    _setup_rcparams()
+
+    try:
+        matrix = pae_matrix if isinstance(pae_matrix, np.ndarray) else np.asarray(pae_matrix, dtype=float)
+    except Exception as e:
+        logger.error("PAE PNG: could not coerce input to array (%s)", e)
+        return None
+    if matrix.ndim == 3 and matrix.shape[0] == 1:
+        matrix = matrix[0]
+    if matrix.ndim != 2 or matrix.shape[0] == 0 or matrix.shape[0] != matrix.shape[1]:
+        logger.warning("PAE PNG: matrix shape %s is not a square 2D array", matrix.shape)
+        return None
+    matrix = np.where(np.isfinite(matrix), matrix, np.nan)
+
+    n_res = int(matrix.shape[0])
+    vmax = _pae_vmax(matrix, max_error)
+
+    out_path = Path(out_path)
+    out_path.parent.mkdir(parents=True, exist_ok=True)
+
+    fig, ax = plt.subplots(figsize=figsize)
+    im = ax.imshow(
+        matrix,
+        cmap=_PAE_CMAP,
+        vmin=0.0,
+        vmax=vmax,
+        origin="upper",
+        interpolation="nearest",
+        extent=(0.0, float(n_res), float(n_res), 0.0),
+        aspect="equal",
+    )
+    ax.set_xlim(0.0, float(n_res))
+    ax.set_ylim(float(n_res), 0.0)
+    ax.set_xlabel("Scored residue", fontsize=12, labelpad=8)
+    ax.set_ylabel("Aligned residue", fontsize=12, labelpad=8)
+    ax.xaxis.set_major_locator(MaxNLocator(nbins=6, integer=True))
+    ax.yaxis.set_major_locator(MaxNLocator(nbins=6, integer=True))
+    ax.xaxis.set_major_formatter(FuncFormatter(_format_residue_tick))
+    ax.yaxis.set_major_formatter(FuncFormatter(_format_residue_tick))
+    ax.tick_params(axis="both", labelsize=10, length=3, width=0.7, colors="#111111")
+    for spine in ax.spines.values():
+        spine.set_visible(True)
+        spine.set_linewidth(0.8)
+        spine.set_edgecolor("#777777")
+
+    if chain_boundaries:
+        for b in chain_boundaries:
+            ax.axhline(b, color="black", linewidth=0.8)
+            ax.axvline(b, color="black", linewidth=0.8)
+
+    title = "Predicted aligned error (PAE)"
+    if model_label:
+        title = f"{title} – {model_label}"
+    ax.set_title(title, fontsize=14, pad=12)
+
+    cbar = fig.colorbar(im, ax=ax, orientation="horizontal", fraction=0.05, pad=0.10)
+    ticks = np.arange(0.0, vmax + 0.1, 5.0)
+    if len(ticks) > 8:
+        ticks = np.linspace(0.0, vmax, 7)
+    cbar.set_ticks(ticks)
+    cbar.ax.xaxis.set_major_formatter(FuncFormatter(lambda v, _pos: f"{v:g}"))
+    cbar.ax.tick_params(labelsize=10, length=0, pad=3)
+    cbar.outline.set_linewidth(0.7)
+    cbar.outline.set_edgecolor("#777777")
+    cbar.ax.set_xlabel("Expected position error (Ångströms)", fontsize=10, labelpad=7)
+
+    fig.tight_layout()
+    fig.savefig(str(out_path), dpi=dpi, bbox_inches="tight")
+    plt.close(fig)
+    return out_path
+
+
 def _pae_page(
     pdf: PdfPages,
     *,
     title: str,
     entry_id: str,
     section_no: str,
-    image_path: Path,
+    pae_path: Path,
     model_label: str,
     page_no: int,
     total: int,
@@ -1135,13 +1312,35 @@ def _pae_page(
 ) -> None:
     fig = _new_figure()
     _add_page_header(fig, page_no=page_no, total=total, title=title, entry=entry_id)
+
     _draw_section_heading(
-        fig, x=0.07, y=0.91, w=0.86, h=0.03,
-        number=section_no, title=f"Predicted Aligned Error – {model_label}",
+        fig,
+        x=0.07,
+        y=0.895,
+        w=0.86,
+        h=0.045,
+        number=section_no,
+        title="Predicted aligned error (PAE)",
+        show_info=False,
     )
-    img_ax = fig.add_axes((0.13, 0.10, 0.74, 0.78))
+
+    if model_label:
+        sub_ax = fig.add_axes((0.10, 0.855, 0.80, 0.030))
+        sub_ax.axis("off")
+        sub_ax.text(
+            0.5,
+            0.5,
+            f"Model: {model_label}",
+            ha="center",
+            va="center",
+            fontsize=9,
+            color="#555555",
+            transform=sub_ax.transAxes,
+        )
+
+    img_ax = fig.add_axes((0.10, 0.105, 0.80, 0.730))
     try:
-        img = mpimg.imread(str(image_path))
+        img = mpimg.imread(str(pae_path))
         img_ax.imshow(img)
     except Exception as e:
         img_ax.text(0.5, 0.5, f"PAE image unavailable\n({e})", ha="center", va="center")
@@ -1149,6 +1348,7 @@ def _pae_page(
     img_ax.set_yticks([])
     for spine in img_ax.spines.values():
         spine.set_visible(False)
+
     _add_page_footer(fig, page_no=page_no, total=total, last=last)
     pdf.savefig(fig)
     plt.close(fig)
@@ -1413,7 +1613,7 @@ def generate_per_run_report(
     best_model = str(best.get("model_used") or "")
     other_models = [m for m in by_model if m and m != best_model]
 
-    pae_png = _find_pae_png(run_dir, best_model)
+    pae_path = _find_pae_png(run_dir, best_model)
     # Pick the best model's rows for the per-interface slider pages; sort by
     # metascore descending so the strongest interface comes first.
     best_model_rows = by_model.get(best_model, list(rows))
@@ -1428,7 +1628,7 @@ def generate_per_run_report(
         1  # cover
         + (1 if show_interface_table else 0)  # overview table
         + len(interface_rows)  # one slider page per interface
-        + (1 if pae_png else 0)  # PAE heatmap
+        + (1 if pae_path else 0)  # PAE heatmap
         + len(other_models)  # non-best-model appendix
     )
 
@@ -1517,14 +1717,14 @@ def generate_per_run_report(
             )
         next_section = quality_section_no + 1
 
-        if pae_png is not None:
+        if pae_path is not None:
             page_no += 1
             _pae_page(
                 pdf,
                 title=_REPORT_TITLE,
                 entry_id=entry_id,
                 section_no=str(next_section),
-                image_path=pae_png,
+                pae_path=pae_path,
                 model_label=best_model,
                 page_no=page_no,
                 total=total,
diff --git a/src/alphajudge/runner.py b/src/alphajudge/runner.py
index 808fb3f5..65087173 100644
--- a/src/alphajudge/runner.py
+++ b/src/alphajudge/runner.py
@@ -15,6 +15,7 @@
 from .parsers import pick_parser
 from .complex import Complex
 from .meta_score import interface_meta_score
+from .report import render_pae_png
 
 logger = logging.getLogger(__name__)
 
@@ -23,41 +24,29 @@ def _save_pae_heatmap(
     pae_matrix,
     out_file: Path,
     chain_boundaries: list[float] | None = None,
-    figsize: tuple[int, int] = (10, 10),
+    figsize: tuple[int, int] = (8, 8),
+    model_label: str | None = None,
 ) -> None:
     """
     Save a PAE heatmap PNG for a given residue×residue PAE matrix.
 
-    Optionally draw vertical and horizontal separator lines at positions
-    provided in `chain_boundaries` (typically between different chains).
+    Uses ``alphajudge.report.render_pae_png`` so the standalone PNG matches
+    the in-report PAE page exactly (AlphaFold-DB-like green palette, horizontal
+    "Expected position error (Å)" colour bar, Scored/Aligned residue axes).
+
+    Optionally draws thin grey separator lines at positions provided in
+    ``chain_boundaries`` (between different chains).
     """
+    if pae_matrix is None:
+        return
     try:
-        # pae_matrix is already a numpy array for memory efficiency
-        mtx = pae_matrix if isinstance(pae_matrix, np.ndarray) else np.array(pae_matrix, dtype=float)
-        if mtx.size == 0:
-            logger.warning(f"empty PAE matrix; skipping heatmap for {out_file}")
-            return
-
-        # Ensure parent exists (safe no-op if already exists)
-        out_file.parent.mkdir(parents=True, exist_ok=True)
-
-        fig, ax = plt.subplots(figsize=figsize)
-        im = ax.imshow(mtx, cmap="Greens_r", vmin=0, vmax=30)
-        ax.set_xlabel("Scored residue", fontsize=12)
-        ax.set_ylabel("Aligned residue", fontsize=12)
-        ax.set_title("Predicted Aligned Error (PAE)", fontsize=14, fontweight="bold")
-
-        if chain_boundaries:
-            for b in chain_boundaries:
-                ax.axhline(b, color="black", linewidth=0.5)
-                ax.axvline(b, color="black", linewidth=0.5)
-
-        cbar = fig.colorbar(im, ax=ax)
-        cbar.set_label("Expected position error (Å)", rotation=270, labelpad=20)
-
-        fig.tight_layout()
-        fig.savefig(out_file, dpi=300)
-        plt.close(fig)
+        render_pae_png(
+            out_file,
+            pae_matrix,
+            model_label=model_label,
+            chain_boundaries=chain_boundaries,
+            figsize=figsize,
+        )
         logger.info(f"wrote {out_file}")
     except Exception as e:
         logger.error(f"Could not create PAE heatmap {out_file}: {e}")

From ace1c7009f5b1796398fdfb74f527557b1f31399 Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Thu, 28 May 2026 10:58:51 +0200
Subject: [PATCH 14/15] Use interface_hb instead of interface_area in metascore
 + report

Inspecting the canonical benchmark_26 table (n=7,756 balanced) shows
that interface_area and interface_solv_en are near-redundant
(Pearson rho = -0.80), so the previous biophysical trio
(sc / area / solv_en) was effectively (sc / size / size). interface_sc
is the only biophysical feature that is genuinely orthogonal to the
rest, and its AUROC (0.746) is the highest among biophysicals.

Among the size-cluster features, interface_hb (0.703) is the most
interpretable (count of polar contacts), is slightly less correlated
with solv_en than area is, and adds a different physical concept
(directional polar interactions) on top of geometry and hydrophobic
burial. interface_sb (0.681), interface_ss (chance, disulfides too
sparse) and interface_contact_pairs (0.694) are all weaker than
interface_hb and more redundant with area.

Changes:
  - META_SCORE_FEATURES swaps interface_area for interface_hb.
  - FEATURE_DIRECTIONS keeps interface_area for backward compat but
    adds interface_hb (direction +1).
  - BENCHMARK_QUANTILES gains an interface_hb entry computed from the
    final_sync_20260523 benchmark (deciles 0, 2, 4, 6, 8, 10, 12, 15,
    20, 28, 129).
  - report.py's _BIOPHYSICAL_FEATURES shows
    (sc, hb, solv_en) and the display label "Hydrogen bonds".
  - Drop the small "AlphaJudge report" wordmark from the per-page
    footer; the running header at the top already identifies the
    report on every page.

Existing interfaces.csv files have a stale interface_meta_score
(computed with area instead of hb) until re-scored with
--force_recompute. Tests updated to confirm the new metascore
feature set behaves correctly.
---
 src/alphajudge/meta_score.py | 21 ++++++++++++++++++++-
 src/alphajudge/report.py     | 16 ++++------------
 2 files changed, 24 insertions(+), 13 deletions(-)

diff --git a/src/alphajudge/meta_score.py b/src/alphajudge/meta_score.py
index 89ed1284..cba67209 100644
--- a/src/alphajudge/meta_score.py
+++ b/src/alphajudge/meta_score.py
@@ -14,7 +14,7 @@
     "average_interface_pae",
     "pDockQ/mpDockQ",
     "interface_sc",
-    "interface_area",
+    "interface_hb",
     "interface_solv_en",
 )
 
@@ -27,6 +27,7 @@
     "average_interface_pae": -1.0,
     "pDockQ/mpDockQ": 1.0,
     "interface_sc": 1.0,
+    "interface_hb": 1.0,
     "interface_area": 1.0,
     "interface_solv_en": -1.0,
 }
@@ -154,6 +155,24 @@
         0.59373881458964451,
         0.74402412409164909,
     ),
+    # Deciles for interface_hb computed on the benchmark_26 final-sync table
+    # (7,756 best-interface rows). Replaces interface_area in METASCORE: H-bond
+    # count is interpretable, only weakly correlated with interface_sc, and
+    # captures specific polar interactions, whereas area was strongly
+    # redundant with solvation energy (Pearson rho = -0.80).
+    "interface_hb": (
+        0.0,
+        2.0,
+        4.0,
+        6.0,
+        8.0,
+        10.0,
+        12.0,
+        15.0,
+        20.0,
+        28.0,
+        129.0,
+    ),
     "interface_area": (
         12.696379714313343,
         581.59180907251502,
diff --git a/src/alphajudge/report.py b/src/alphajudge/report.py
index 892bb2e7..476974ff 100644
--- a/src/alphajudge/report.py
+++ b/src/alphajudge/report.py
@@ -94,6 +94,7 @@
     "average_interface_pae": "Avg. interface PAE",
     "pDockQ/mpDockQ": "pDockQ / mpDockQ",
     "interface_sc": "Shape complementarity",
+    "interface_hb": "Hydrogen bonds",
     "interface_area": "Interface area",
     "interface_solv_en": "Solvation energy",
 }
@@ -118,7 +119,7 @@
 )
 _BIOPHYSICAL_FEATURES = (
     "interface_sc",
-    "interface_area",
+    "interface_hb",
     "interface_solv_en",
 )
 
@@ -418,17 +419,8 @@ def _add_page_header(fig: plt.Figure, *, page_no: int, total: int, title: str, e
 
 
 def _add_page_footer(fig: plt.Figure, *, page_no: int, total: int, last: bool) -> None:
-    """Small centered AlphaJudge mark; no third-party wordmark."""
-    if page_no <= 1:
-        return
-    _draw_alphajudge_logo(
-        fig,
-        x=0.5,
-        y=0.028,
-        w=0.170,
-        h=0.034,
-        compact=True,
-    )
+    """No footer mark; the running header already identifies the report."""
+    return
 
 
 def _draw_info_box(fig: plt.Figure, *, x: float, y: float, w: float, h: float, lines: Sequence[str]) -> None:

From 71d44ebd61803acdc38c9aeb06037e30c434789f Mon Sep 17 00:00:00 2001
From: Dima Molodenskiy <dmolodenskiy@embl-hamburg.de>
Date: Thu, 28 May 2026 11:19:12 +0200
Subject: [PATCH 15/15] Refresh BENCHMARK_QUANTILES to canonical
 final_sync_20260523 table

Re-computes the 11-anchor decile table for every metascore feature
on the final synchronized benchmark_26 best-interface CSV
(benchmark_best.final_sync_20260523_225722_force_recompute_nointerfacefix.csv,
n=7,756). The previous values were derived from an earlier n=7,345
April 22 snapshot before the pair-matched predictions were back-filled.

Notable shifts (after sign-flip where applicable):
  - interface_LIS:        p50 0.060 -> 0.041, p90 0.516 -> 0.510 (slightly tighter)
  - interface_pDockQ2:    floor lowered from 7.5e-3 -> 0 (more dynamic range)
  - interface_sc:         p10 -0.210 -> -0.091 (the new dataset has fewer
                          extreme low-Sc cases at the tail)
  - interface_area:       p100 23,847 -> 19,027 (one extreme outlier
                          excluded by the back-fill)
  - interface_solv_en:    p100 400.7 -> 233.0
  - confidence_score:     p0 0.127 -> -99.73 (sentinel for failed
                          predictions now contributes to the tail)
  - interface_hb:         unchanged (computed on this same table already)

Header comment in BENCHMARK_QUANTILES updated to point at the new
source. interface_meta_score values in existing interfaces.csv files
will move by a few percentage points after re-scoring with
--force_recompute; the 8hhy demo report was re-generated.
---
 src/alphajudge/meta_score.py | 215 ++++++++++++++++++-----------------
 1 file changed, 108 insertions(+), 107 deletions(-)

diff --git a/src/alphajudge/meta_score.py b/src/alphajudge/meta_score.py
index cba67209..628544af 100644
--- a/src/alphajudge/meta_score.py
+++ b/src/alphajudge/meta_score.py
@@ -46,10 +46,11 @@
     1.0,
 )
 
-# Frozen deciles from the benchmark_26 all-organism best-interface run
-# (7,345 AF2/AF3 positive/negative rows; April 22, 2026 merged table).
-# Values are already oriented so larger is better; e.g. PAE and solvation
-# energy are stored after sign flip.
+# Frozen deciles from the benchmark_26 final synchronized best-interface run
+# (7,756 AF2/AF3 positive/negative rows; final_sync_20260523_225722, after
+# the missing pair-matched predictions were back-filled). Values are already
+# oriented so larger is better; e.g. PAE and solvation energy are stored
+# after sign flip.
 BENCHMARK_QUANTILES = {
     "interface_LIS": (
         0.0,
@@ -57,12 +58,12 @@
         0.0,
         0.0,
         0.0,
-        0.059720202020202,
-        0.16705226076310281,
-        0.29334500115446349,
-        0.40119327202506005,
-        0.51623890758784829,
-        0.75338038596492163,
+        0.04087949643906165,
+        0.13930053033306905,
+        0.2748901434822449,
+        0.3884159952769791,
+        0.5095176486875836,
+        0.7683597309793258,
     ),
     "interface_ipSAE": (
         0.0,
@@ -70,96 +71,96 @@
         0.0,
         0.0,
         0.0,
-        0.0131470059312316,
-        0.10584161048830307,
-        0.43384587935260738,
-        0.64412107036419464,
-        0.77087459523243229,
-        0.95559878883735405,
+        0.01145996318417455,
+        0.04849651380227124,
+        0.39191523664041816,
+        0.631408256291724,
+        0.7685336920803372,
+        0.955598788837354,
     ),
     "interface_pDockQ2": (
-        0.0075494887493505998,
-        0.0089492092351328,
-        0.0093933511858568398,
-        0.0098769987230639799,
-        0.010703449712070559,
-        0.0124802347229461,
-        0.018771163348387087,
-        0.050761707493646967,
-        0.17282606942497017,
-        0.47580370600410854,
-        0.95042261592369204,
+        0.0,
+        0.0088894923938337,
+        0.0093154249757626,
+        0.0097853519732417,
+        0.0105167871915631,
+        0.0121137962077202,
+        0.01700470113788611,
+        0.044079106104955995,
+        0.147310180270119,
+        0.4604512911372348,
+        0.950422615923692,
     ),
     "iptm": (
-        0.040000000000000001,
-        0.14999999999999999,
-        0.17999999999999999,
-        0.21093810200691221,
-        0.25285084247589107,
-        0.31,
-        0.40999999999999998,
-        0.53254582881927492,
-        0.67266757488250806,
-        0.81000000000000005,
-        0.97108757495880116,
+        0.04,
+        0.15,
+        0.18,
+        0.21,
+        0.2422413975000381,
+        0.2993520200252533,
+        0.38812878727913014,
+        0.51,
+        0.66,
+        0.8086847960948944,
+        0.9710875749588012,
     ),
     "confidence_score": (
-        0.12678638003217149,
-        0.23979955960633545,
-        0.28000000000000003,
-        0.32000000000000001,
-        0.37,
-        0.42999999999999999,
-        0.51000000000000001,
-        0.61354833086340177,
-        0.73788607560146302,
-        0.84101645584207918,
-        1.1499999999999999,
+        -99.73,
+        0.24,
+        0.279434748489446,
+        0.32,
+        0.3648142071999158,
+        0.42,
+        0.5,
+        0.6002808797233267,
+        0.7262544258927405,
+        0.84,
+        1.17,
     ),
     "average_interface_pae": (
-        -31.5,
-        -27.859964220839984,
-        -26.073899561846982,
-        -24.438900954877365,
-        -22.36344086021505,
-        -20.006129032258062,
-        -16.573059698130209,
-        -11.591519818964887,
-        -6.7923660714285621,
-        -3.6440909090909086,
-        -1.0446969696969697,
+        -31.466666666666665,
+        -28.001159075666123,
+        -26.179307692307695,
+        -24.495731538992413,
+        -22.704047619047614,
+        -20.205151515151503,
+        -17.110826882477134,
+        -11.98133340586016,
+        -7.214102564102556,
+        -3.7483788429752054,
+        -1.0446969696969706,
     ),
     "pDockQ/mpDockQ": (
-        0.018258893561979499,
-        0.048401733659705799,
-        0.080583999776873999,
-        0.11763635331753999,
-        0.1609442064816457,
-        0.21622604840653531,
-        0.28893407672657195,
-        0.39005367493568538,
-        0.502151558453238,
-        0.62055885656958631,
-        0.74034050365479986,
+        0.0,
+        0.04342955378732375,
+        0.0744205498951194,
+        0.11156935841275703,
+        0.154663210767691,
+        0.20778370916876399,
+        0.28249571167245185,
+        0.3758437409692674,
+        0.4920927853075837,
+        0.6177077320794855,
+        0.7403745371795283,
     ),
     "interface_sc": (
-        -0.20978600009076619,
-        0.19474781603546867,
-        0.25907145776977002,
-        0.32226136048686279,
-        0.38997362215252516,
-        0.42865133273885592,
-        0.46107348285381024,
-        0.49758078915313065,
-        0.54187397531551566,
-        0.59373881458964451,
-        0.74402412409164909,
+        -0.0909274325112387,
+        0.2727699720080689,
+        0.3812050398280308,
+        0.4213154557548237,
+        0.4488086853592169,
+        0.47065393187337334,
+        0.4938328663057683,
+        0.5188898407198262,
+        0.54885285443392,
+        0.5914616385120754,
+        0.744024124091351,
     ),
-    # Deciles for interface_hb computed on the benchmark_26 final-sync table
-    # (7,756 best-interface rows). Replaces interface_area in METASCORE: H-bond
+    # Deciles for interface_hb replace interface_area in METASCORE: H-bond
     # count is interpretable, only weakly correlated with interface_sc, and
     # captures specific polar interactions, whereas area was strongly
-    # redundant with solvation energy (Pearson rho = -0.80).
+    # redundant with solvation energy (Pearson rho = -0.80 on the same
+    # benchmark).
     "interface_hb": (
         0.0,
         2.0,
@@ -174,30 +175,30 @@
         129.0,
     ),
     "interface_area": (
-        12.696379714313343,
-        581.59180907251502,
-        830.76128351670551,
-        1067.0180525575927,
-        1311.9445584680248,
-        1586.0792814579392,
-        1912.6781164897349,
-        2333.6612364858556,
-        2898.2619149565764,
-        3914.9127720160723,
-        23847.404872232858,
+        0.0,
+        542.1321074137181,
+        813.3952069762071,
+        1038.3245889227087,
+        1289.939806795484,
+        1559.6427719907642,
+        1897.2281626043305,
+        2361.926012313381,
+        2928.3984815923395,
+        3943.2489991553953,
+        19027.209490273777,
     ),
     "interface_solv_en": (
-        -26.140681977743796,
-        0.38162628724614497,
-        3.1598266879255246,
-        5.8459112057851663,
-        8.5967875314312085,
-        11.475426312687474,
-        15.228084355320659,
-        20.067672952580592,
-        27.302842021122294,
-        39.330244540335536,
-        400.66271273444442,
+        -26.14067293563187,
+        0.03920834959131975,
+        2.8962665146694064,
+        5.443213873630101,
+        8.057221500635805,
+        10.930657812354951,
+        14.625751361301866,
+        19.243051691872445,
+        26.38771636631324,
+        38.319393210666135,
+        233.00683345812263,
     ),
 }