# motief/analysis/right_wing/overton_breakpoint_analysis.py

#!/usr/bin/env python3
"""U2: Quantify the 2024 Overton Window breakpoint in Dutch parliament.

Descriptive analysis of centrist support, pass rates, and content extremity
for right-wing motions — with coalition control via opposition-only filtering,
domain decomposition, and a baseline comparison.

Usage:
    uv run python analysis/right_wing/overton_breakpoint_analysis.py

Output:
    reports/overton_window/breakpoint_analysis.md
    reports/overton_window/breakpoint_figure_1.png
    reports/overton_window/breakpoint_figure_2.png
"""

from __future__ import annotations

import json
import logging
import random
import re
import sys
from pathlib import Path
from typing import Any

import duckdb
import matplotlib
import numpy as np

matplotlib.use("Agg")
import matplotlib.pyplot as plt
import matplotlib.ticker as mticker

ROOT = Path(__file__).parent.parent.parent.resolve()
if str(ROOT) not in sys.path:
    sys.path.insert(0, str(ROOT))

from analysis.config import CANONICAL_LEFT, CANONICAL_RIGHT, PARTY_COLOURS

# Parties treated as "centrist" by this analysis (defined here, not in analysis.config).
CANONICAL_CENTRIST = frozenset({"VVD", "D66", "CDA", "NSC", "BBB", "CU"})

# NOTE: logging is configured at import time, so importing this module has a side effect.
logging.basicConfig(level=logging.INFO, format="%(asctime)s %(levelname)s %(message)s")
logger = logging.getLogger(__name__)

# Input database and output directory, both resolved relative to the repository root.
DB_PATH = str(ROOT / "data" / "motions.db")
REPORTS_DIR = ROOT / "reports" / "overton_window"
# Created at import time so the figure/report writers can save into it directly.
REPORTS_DIR.mkdir(parents=True, exist_ok=True)

# Plain-set copies of the party groupings (CANONICAL_CENTRIST above is a frozenset;
# the original note says config defines its groupings as frozensets too).
CANONICAL_CENTRIST_SET = set(CANONICAL_CENTRIST)
CANONICAL_LEFT_SET = set(CANONICAL_LEFT)
CANONICAL_RIGHT_SET = set(CANONICAL_RIGHT)

# Governing coalition per calendar year; used to decide whether a lead submitter
# counts as "opposition". Year-level coding caveats are spelled out in COALITION_NOTE.
COALITION: dict[int, set[str]] = {
    2016: {"VVD", "PvdA"},
    2017: {"VVD", "PvdA"},
    2018: {"VVD", "CDA", "D66", "CU"},
    2019: {"VVD", "CDA", "D66", "CU"},
    2020: {"VVD", "CDA", "D66", "CU"},
    2021: {"VVD", "CDA", "D66", "CU"},
    2022: {"VVD", "D66", "CDA", "CU"},
    2023: {"VVD", "D66", "CDA", "CU"},
    2024: {"PVV", "VVD", "NSC", "BBB"},
    2025: {"PVV", "VVD", "NSC", "BBB"},
    2026: {"PVV", "VVD", "NSC", "BBB"},
}

# Human-readable description of the COALITION coding; embedded verbatim in the report.
COALITION_NOTE = (
    "2016-2017: Rutte II (VVD/PvdA). "
    "2018-2021: Rutte III (VVD/CDA/D66/CU). "
    "2022-2023: Rutte IV (VVD/D66/CDA/CU). "
    "2024-2026: Schoof (PVV/VVD/NSC/BBB). "
    "2024 ambiguous: Schoof cabinet started July 2024; all 2024 motions are coded "
    "to the Schoof coalition. Coalition effect may be overestimated for early 2024."
)

# Inclusive analysis window; every per-year container is pre-populated for this range.
YEAR_MIN, YEAR_MAX = 2016, 2026
# First year counted as "post" in all pre/post comparisons.
BREAK_YEAR = 2024


def _conn(read_only: bool = True) -> duckdb.DuckDBPyConnection:
    """Open a DuckDB connection to ``DB_PATH``.

    Args:
        read_only: Forwarded to ``duckdb.connect``; defaults to ``True``.

    Returns:
        The connection object produced by ``duckdb.connect``.
    """
    connection = duckdb.connect(DB_PATH, read_only=read_only)
    return connection


def cohens_d(x: np.ndarray, y: np.ndarray) -> float:
    """Return Cohen's d for the shift from ``x`` to ``y`` (``mean(y) - mean(x)``).

    The standardiser is the square root of the *unweighted* average of the two
    sample variances (``ddof=1``). This equals the classic pooled SD only when
    both groups have the same size; the formula is kept as-is so previously
    reported values stay comparable.

    Args:
        x: Baseline ("pre") observations.
        y: Comparison ("post") observations.

    Returns:
        The effect size as a plain ``float``. Special cases:

        * ``nan`` when either sample has fewer than two observations (the
          sample variance is undefined there);
        * ``0.0`` when both samples have zero variance and equal means;
        * ``+inf`` / ``-inf`` when both samples have zero variance but the
          means differ (perfect separation must not be reported as "no effect").
    """
    x = np.asarray(x, dtype=float)
    y = np.asarray(y, dtype=float)

    # ddof=1 variance needs at least two points; bail out before NumPy warns.
    if x.size < 2 or y.size < 2:
        return float("nan")

    diff = float(np.mean(y) - np.mean(x))
    pooled = float(np.sqrt((np.var(x, ddof=1) + np.var(y, ddof=1)) / 2))
    if pooled == 0:
        if diff == 0:
            return 0.0
        return float(np.copysign(np.inf, diff))
    return diff / pooled


def compute_yearly_rw_metrics(con: duckdb.DuckDBPyConnection) -> dict[int, dict]:
    """Collect per-year raw value lists for classified right-wing motions.

    A single query joins ``right_wing_motions`` with ``extremity_scores`` and
    ``motions``; the rows are then grouped by ``r.year`` for every year in
    ``YEAR_MIN..YEAR_MAX`` (rows outside that window are dropped).

    Args:
        con: Open DuckDB connection.

    Returns:
        Mapping ``year -> dict`` of parallel lists (``centrist_support``,
        ``right_support``, ``left_opposition``, ``extremity``, ``passed``,
        ``categories``, ``titles``, ``motion_ids``). Missing numeric values are
        stored as ``np.nan``; ``passed`` holds ``True``/``False``/``None``.
    """
    records = con.execute("""
        SELECT
            r.motion_id,
            r.year,
            r.title,
            r.centrist_support,
            r.right_support,
            r.left_opposition,
            r.category,
            e.text_score AS extremity_score,
            m.voting_results,
            m.winning_margin
        FROM right_wing_motions r
        JOIN extremity_scores e ON r.motion_id = e.motion_id
        JOIN motions m ON r.motion_id = m.id
        WHERE r.classified = TRUE
          AND r.year IS NOT NULL
          AND e.text_score IS NOT NULL
    """).fetchall()

    list_keys = (
        "centrist_support",
        "right_support",
        "left_opposition",
        "extremity",
        "passed",
        "categories",
        "titles",
        "motion_ids",
    )
    yearly: dict[int, dict[str, Any]] = {
        yr: {key: [] for key in list_keys}
        for yr in range(YEAR_MIN, YEAR_MAX + 1)
    }

    def _or_nan(value: Any) -> Any:
        # NULL metrics become NaN so the lists stay index-aligned.
        return np.nan if value is None else value

    for record in records:
        (
            motion_id,
            year,
            title,
            centrist,
            right,
            left,
            category,
            extremity,
            raw_votes,
            margin,
        ) = record
        if year is None or year < YEAR_MIN or year > YEAR_MAX:
            continue

        bucket = yearly[year]
        bucket["centrist_support"].append(_or_nan(centrist))
        bucket["right_support"].append(_or_nan(right))
        bucket["left_opposition"].append(_or_nan(left))
        bucket["extremity"].append(_or_nan(extremity))
        bucket["categories"].append(category or "other")
        bucket["titles"].append(title or "")
        bucket["motion_ids"].append(motion_id)

        # voting_results may arrive as a JSON string or as an already-decoded value.
        if raw_votes is None:
            voting = {}
        elif isinstance(raw_votes, str):
            voting = json.loads(raw_votes)
        else:
            voting = raw_votes
        bucket["passed"].append(_motion_passed(voting, margin))

    return yearly


def compute_yearly_baseline(con: duckdb.DuckDBPyConnection) -> dict[int, dict]:
    """Build the all-motions baseline (not restricted to right-wing motions).

    Two queries are run: one over ``motions`` for pass/fail outcomes and one
    over ``mp_votes`` (grouped per motion, year, party and vote) from which a
    centrist support ratio per motion is derived.

    Args:
        con: Open DuckDB connection.

    Returns:
        Mapping ``year -> {"passed": [...], "centrist_support": [...]}`` for
        every year in ``YEAR_MIN..YEAR_MAX``. The two lists are independent
        (they are not index-aligned with each other).
    """
    motion_rows = con.execute("""
        SELECT
            m.id AS motion_id,
            EXTRACT(YEAR FROM m.date) AS year,
            m.voting_results,
            m.winning_margin
        FROM motions m
        WHERE m.date IS NOT NULL
    """).fetchall()

    yearly: dict[int, dict] = {
        yr: {"passed": [], "centrist_support": []}
        for yr in range(YEAR_MIN, YEAR_MAX + 1)
    }

    for _motion_id, raw_year, raw_votes, margin in motion_rows:
        if raw_year is None:
            continue
        yr = int(raw_year)
        if yr < YEAR_MIN or yr > YEAR_MAX:
            continue
        if raw_votes is None:
            voting = {}
        elif isinstance(raw_votes, str):
            voting = json.loads(raw_votes)
        else:
            voting = raw_votes
        yearly[yr]["passed"].append(_motion_passed(voting, margin))

    vote_rows = con.execute("""
        SELECT
            mv.motion_id,
            EXTRACT(YEAR FROM mv.date) AS year,
            mv.party,
            COUNT(*) AS n,
            mv.vote
        FROM mp_votes mv
        WHERE mv.party IS NOT NULL
          AND mv.date IS NOT NULL
        GROUP BY mv.motion_id, EXTRACT(YEAR FROM mv.date), mv.party, mv.vote
    """).fetchall()

    # motion -> party -> vote label -> count, plus the (last seen) year of each motion.
    party_votes_by_motion: dict[int, dict[str, dict[str, int]]] = {}
    year_by_motion: dict[int, int] = {}
    for motion_id, raw_year, party, count, vote in vote_rows:
        yr = int(raw_year)
        if yr < YEAR_MIN or yr > YEAR_MAX:
            continue
        year_by_motion[motion_id] = yr
        per_party = party_votes_by_motion.setdefault(motion_id, {})
        tally = per_party.setdefault(party, {"voor": 0, "tegen": 0, "afwezig": 0})
        tally[vote] = tally.get(vote, 0) + count

    for motion_id, per_party in party_votes_by_motion.items():
        ratio = _support_ratio(per_party, CANONICAL_CENTRIST_SET)
        if ratio is not None:
            yearly[year_by_motion[motion_id]]["centrist_support"].append(ratio)

    return yearly


def _motion_passed(
    voting: dict[str, str], winning_margin: float | None = None
) -> bool | None:
    """Determine if a motion passed from voting_results or winning_margin."""
    if winning_margin is not None:
        return winning_margin > 0
    voor = sum(1 for v in voting.values() if v == "voor")
    tegen = sum(1 for v in voting.values() if v == "tegen")
    if voor + tegen == 0:
        return None
    return voor > tegen


def _support_ratio(
    votes: dict[str, dict[str, int]], parties: set[str]
) -> float | None:
    """Compute support ratio (fraction of parties voting 'voor')."""
    total = 0
    supportive = 0
    for party, pv in votes.items():
        if party not in parties:
            continue
        tv = pv.get("voor", 0) + pv.get("tegen", 0) + pv.get("afwezig", 0)
        if tv == 0:
            continue
        total += 1
        if pv.get("voor", 0) / tv >= 0.5:
            supportive += 1
    if total == 0:
        return None
    return supportive / total


def build_party_name_map(con: duckdb.DuckDBPyConnection) -> dict[str, str]:
    """Build a ``last name -> party`` lookup from ``mp_metadata``.

    The last name is the part of ``mp_name`` before the first comma. Rows are
    visited in the query's order and the first party seen for a last name
    wins, so MPs who share a last name collapse onto a single party.

    Rows with a NULL or blank ``mp_name`` are skipped instead of crashing on
    ``.split`` or producing an empty-string key.

    Args:
        con: Open DuckDB connection.

    Returns:
        Mapping from last name to party.
    """
    # NOTE(review): NULL ``tot_en_met`` sorts last; if NULL means "still in
    # office", sitting MPs lose name collisions to former MPs — confirm intent.
    rows = con.execute("""
        SELECT mp_name, party, van, tot_en_met
        FROM mp_metadata
        WHERE party IS NOT NULL
        ORDER BY tot_en_met DESC NULLS LAST, van DESC NULLS LAST
    """).fetchall()

    last_to_party: dict[str, str] = {}
    for mp_name, party, _van, _tot in rows:
        if not mp_name:
            continue
        last = mp_name.split(",")[0].strip()
        if not last:
            continue
        # First occurrence wins (rows arrive in the query's ORDER BY order).
        last_to_party.setdefault(last, party)
    return last_to_party


# Title prefixes naming the submitter(s); motions are tried before amendments.
# The leading letter is matched in either case so that "Gewijzigde motie ..." /
# "Nader gewijzigde motie ..." / "Gewijzigd amendement ..." titles are recognised too.
_SUBMITTER_PATTERNS = (
    re.compile(
        r"\b[Mm]otie\s+van\s+(?:het\s+lid|de\s+leden)\s+(.+?)\s+(?:c\.s\.\s+)?over\b"
    ),
    re.compile(
        r"\b[Aa]mendement\s+van\s+(?:het\s+lid|de\s+leden)\s+(.+?)\s+over\b"
    ),
)


def parse_lead_submitter(
    title: str, name_party_map: dict[str, str]
) -> tuple[str | None, str | None]:
    """Parse the lead submitter from a motion title and map the name to a party.

    The submitter list is the text between "van het lid" / "van de leden" and
    the word "over". The lead submitter is the first name in that list, where
    names may be separated by " en " or by commas; a trailing "c.s." is dropped.

    Args:
        title: Motion or amendment title; may be empty or ``None``.
        name_party_map: Lookup from submitter name (as written in titles) to party.

    Returns:
        ``(name, party)``. ``party`` is ``None`` when the name is not in
        ``name_party_map``; ``(None, None)`` when no submitter can be parsed.
    """
    if not title:
        return None, None

    for pattern in _SUBMITTER_PATTERNS:
        match = pattern.search(title)
        if match is None:
            continue
        submitters = match.group(1).strip()
        # "A en B" and "A, B en C" both yield "A".
        lead = submitters.split(" en ")[0].split(",")[0].strip()
        lead = re.sub(r"\s+c\.s\.", "", lead).strip()
        if not lead:
            continue
        return lead, name_party_map.get(lead)

    return None, None


def compute_opposition_metrics(
    yearly_raw: dict[int, dict], name_party_map: dict[str, str]
) -> dict[int, dict]:
    """Recompute the yearly raw lists for opposition-only right-wing motions.

    A motion is kept when its lead submitter (parsed from the title) maps to a
    party that is NOT in that year's ``COALITION`` entry. Motions whose
    submitter cannot be parsed or mapped to a party are dropped, so they count
    as neither coalition nor opposition.

    Args:
        yearly_raw: Per-year parallel lists with at least ``titles``,
            ``centrist_support``, ``extremity`` and ``passed``.
        name_party_map: Lookup from submitter name to party.

    Returns:
        Mapping ``year -> {"centrist_support": [...], "extremity": [...],
        "passed": [...], "n": int}`` for every year in ``YEAR_MIN..YEAR_MAX``.
    """
    opp: dict[int, dict[str, Any]] = {
        year: {"centrist_support": [], "extremity": [], "passed": [], "n": 0}
        for year in range(YEAR_MIN, YEAR_MAX + 1)
    }

    for year, d in yearly_raw.items():
        coalition_parties = COALITION.get(year, set())
        for idx, title in enumerate(d["titles"]):
            _name, submitter_party = parse_lead_submitter(title, name_party_map)

            # Unknown submitter: cannot be classified, so leave it out.
            if submitter_party is None or submitter_party in coalition_parties:
                continue

            kept = opp[year]
            kept["centrist_support"].append(d["centrist_support"][idx])
            kept["extremity"].append(d["extremity"][idx])
            kept["passed"].append(d["passed"][idx])
            kept["n"] += 1

    return opp


def compute_domain_metrics(
    yearly_raw: dict[int, dict],
) -> tuple[dict[int, dict], dict[int, dict]]:
    """Partition the yearly raw lists into migration and non-migration motions.

    A motion belongs to the migration domain when its category equals
    ``asiel/vreemdelingen``; every other category is non-migration.

    Returns:
        ``(migration, non_migration)``; each maps every year in
        ``YEAR_MIN..YEAR_MAX`` to ``centrist_support``/``extremity``/``passed``
        lists plus a motion count ``n``.
    """

    def _empty() -> dict[str, Any]:
        return {"centrist_support": [], "extremity": [], "passed": [], "n": 0}

    year_span = range(YEAR_MIN, YEAR_MAX + 1)
    mig: dict[int, dict[str, Any]] = {yr: _empty() for yr in year_span}
    non_mig: dict[int, dict[str, Any]] = {yr: _empty() for yr in year_span}

    for year, d in yearly_raw.items():
        for idx, _title in enumerate(d["titles"]):
            is_migration = d["categories"][idx] == "asiel/vreemdelingen"
            bucket = (mig if is_migration else non_mig)[year]
            for key in ("centrist_support", "extremity", "passed"):
                bucket[key].append(d[key][idx])
            bucket["n"] += 1

    return mig, non_mig


def compute_extremity_stratified(
    yearly_raw: dict[int, dict],
) -> dict[str, dict[str, list]]:
    """Group pass/fail outcomes by extremity bucket, before vs. from ``BREAK_YEAR``.

    Motions with a NaN extremity score or an undecided outcome (``None``) are
    left out.

    Returns:
        ``{"pre-2024": {bucket: [passed, ...]}, "post-2024": {...}}`` with the
        four buckets always present (possibly empty).
    """
    # (exclusive upper bound, label) in ascending order; scores >= 4 use top_label.
    bounds = ((2, "1-2 (mild)"), (3, "2-3 (moderate)"), (4, "3-4 (high)"))
    top_label = "4-5 (extreme)"
    labels = [label for _limit, label in bounds] + [top_label]

    pre_post: dict[str, dict[str, list]] = {
        period: {label: [] for label in labels}
        for period in ("pre-2024", "post-2024")
    }

    for year, d in yearly_raw.items():
        period = "pre-2024" if year < BREAK_YEAR else "post-2024"
        for idx, _title in enumerate(d["titles"]):
            score = d["extremity"][idx]
            outcome = d["passed"][idx]
            if np.isnan(score) or outcome is None:
                continue
            label = next(
                (name for limit, name in bounds if score < limit), top_label
            )
            pre_post[period][label].append(outcome)

    return pre_post


def yearly_summary(yearly: dict[int, dict]) -> dict[int, dict]:
    """Reduce per-year raw lists to summary statistics.

    For each year this yields ``mean_centrist_support``, ``mean_right_support``,
    ``mean_left_opposition`` and ``mean_extremity`` (NaN entries ignored; NaN
    when nothing remains), ``pass_rate`` over decided motions (``None`` entries
    ignored; NaN when none), and ``n`` — the length of ``motion_ids`` if that
    key exists, otherwise the length of ``centrist_support``.
    """

    def _is_nan(value: Any) -> bool:
        return isinstance(value, float) and np.isnan(value)

    metric_keys = ("centrist_support", "right_support", "left_opposition", "extremity")

    summary: dict[int, dict] = {}
    for year, raw in yearly.items():
        stats: dict[str, Any] = {}
        for metric in metric_keys:
            clean = [v for v in raw.get(metric, []) if not _is_nan(v)]
            stats[f"mean_{metric}"] = np.mean(clean) if clean else float("nan")

        decided = [flag for flag in raw.get("passed", []) if flag is not None]
        stats["pass_rate"] = sum(decided) / len(decided) if decided else float("nan")

        fallback = raw.get("centrist_support", [])
        stats["n"] = len(raw.get("motion_ids", fallback))
        summary[year] = stats
    return summary


def sample_audit(yearly_raw: dict[int, dict]) -> list[dict]:
    """Draw a stratified random sample of up to 5 motions per extremity bucket.

    Motions with a NaN extremity score are excluded. Sampling uses a fixed
    seed (42), so the result is reproducible for identical input.

    Returns:
        Sampled motions as dicts with ``year``, ``title``, ``category``,
        ``extremity`` and ``bucket``, sorted by bucket label and then score
        (at most 20 entries).
    """
    # (exclusive upper bound, label) in ascending order; scores >= 4 use top_label.
    bounds = ((2, "1-2 (mild)"), (3, "2-3 (moderate)"), (4, "3-4 (high)"))
    top_label = "4-5 (extreme)"

    # Insertion order matters: it fixes the order in which the RNG is consumed.
    positions_by_bucket: dict[str, list[int]] = {label: [] for _limit, label in bounds}
    positions_by_bucket[top_label] = []

    catalogue: list[dict] = []
    for year, d in yearly_raw.items():
        for idx, title in enumerate(d["titles"]):
            score = d["extremity"][idx]
            if np.isnan(score):
                continue
            label = next(
                (name for limit, name in bounds if score < limit), top_label
            )
            positions_by_bucket[label].append(len(catalogue))
            catalogue.append({
                "year": year,
                "title": title,
                "category": d["categories"][idx],
                "extremity": score,
            })

    rng = random.Random(42)
    sampled: list[dict] = []
    for label, positions in positions_by_bucket.items():
        if not positions:
            continue
        for pos in rng.sample(positions, min(5, len(positions))):
            sampled.append({**catalogue[pos], "bucket": label})

    sampled.sort(key=lambda item: (item["bucket"], item["extremity"]))
    return sampled


def print_audit(sampled: list[dict]) -> None:
    """Print the sampled motions as a checklist for a manual extremity audit.

    Consecutive entries with the same ``bucket`` are shown under one heading,
    so ``sampled`` is expected to arrive grouped by bucket. Titles are cut to
    120 characters.
    """
    from itertools import groupby

    rule = "=" * 80

    print("\n" + rule)
    print("  MANUAL EXTREMITY AUDIT")
    print(rule)
    print()
    print("For each motion below, judge whether you agree with the LLM-assigned extremity bucket.")
    print("Also note: does the score reflect stylistic extremity (language) or material impact (policy)?")
    print()

    for bucket, members in groupby(sampled, key=lambda m: m["bucket"]):
        entries = list(members)
        print(f"\n--- {bucket} (n={len(entries)} sampled) ---")
        for number, motion in enumerate(entries, 1):
            short_title = motion["title"][:120]
            print(f"\n  [{number}] Year={motion['year']} | Category={motion['category']}")
            print(f"      LLM Score: {motion['extremity']}")
            print(f"      Title: {short_title}")
            print("      Agree? [Y/N]  Driven by: Language / Policy / Both")

    print("\n" + rule)
    print("  END OF AUDIT — Record agreement rate and note systematic biases")
    print(rule)


def create_figure_1(
    yearly_sum: dict[int, dict],
    opp_sum: dict[int, dict],
    mig_sum: dict[int, dict],
    non_mig_sum: dict[int, dict],
    baseline_sum: dict[int, dict],
) -> str:
    """Figure 1: centrist support (top) and pass rate (bottom) over time.

    Both panels draw the same five series (all right-wing, opposition-only,
    migration, non-migration, all-motions baseline) and mark the break year.

    Args:
        yearly_sum: Yearly summary for all right-wing motions; its keys define
            the x-axis years.
        opp_sum: Yearly summary for opposition-only right-wing motions.
        mig_sum: Yearly summary for migration motions.
        non_mig_sum: Yearly summary for non-migration motions.
        baseline_sum: Yearly summary across all motions.

    Returns:
        Path of the saved PNG (``breakpoint_figure_1.png`` in ``REPORTS_DIR``).

    Raises:
        KeyError: If one of the summaries lacks a year present in ``yearly_sum``.
    """
    years = sorted(yearly_sum.keys())
    years_arr = np.array(years)

    def _vals(summary, key):
        return np.array([summary[y].get(key, np.nan) for y in years])

    # One entry per line, identical in both panels: (data source, plot kwargs).
    series = [
        (yearly_sum, {"marker": "o", "color": "#002366", "linewidth": 2,
                      "label": "All right-wing", "zorder": 5}),
        (opp_sum, {"marker": "s", "color": "#E53935", "linewidth": 1.5,
                   "linestyle": "--", "label": "Opposition-only RW", "zorder": 4}),
        (mig_sum, {"marker": "^", "color": "#6A1B9A", "linewidth": 1.5,
                   "linestyle": ":", "label": "Migration", "zorder": 3}),
        (non_mig_sum, {"marker": "v", "color": "#4CAF50", "linewidth": 1.5,
                       "linestyle": "-.", "label": "Non-migration", "zorder": 2}),
        (baseline_sum, {"color": "#9E9E9E", "linewidth": 1, "linestyle": "dashed",
                        "alpha": 0.7, "zorder": 1, "label": "All motions (baseline)"}),
    ]
    # (summary key, y-axis label, panel title), top panel first.
    panels = [
        ("mean_centrist_support", "Mean Centrist Support",
         "Centrist Support for Right-Wing Motions Over Time"),
        ("pass_rate", "Pass Rate", "Pass Rate of Right-Wing Motions Over Time"),
    ]

    fig, axes = plt.subplots(2, 1, figsize=(12, 10), sharex=True)

    for ax, (metric, ylabel, title) in zip(axes, panels):
        for summary, style in series:
            ax.plot(years_arr, _vals(summary, metric), **style)

        ax.axvline(x=BREAK_YEAR - 0.5, color="black", linestyle=":", alpha=0.5, linewidth=1)
        ax.set_ylabel(ylabel)
        ax.set_title(title, fontweight="bold")
        ax.legend(loc="lower right", fontsize=8, ncol=2)
        ax.set_ylim(0, 1.05)
        ax.grid(True, alpha=0.3)

        # Place the label only after the y-limits are final; reading get_ylim()
        # before set_ylim() would position it relative to the autoscaled range.
        ax.annotate(str(BREAK_YEAR), xy=(BREAK_YEAR - 0.3, ax.get_ylim()[1] * 0.95),
                    fontsize=9, color="black", alpha=0.7)

    # The x-axis is shared, so tick setup on the bottom panel is enough.
    bottom = axes[-1]
    bottom.set_xlabel("Year")
    bottom.set_xticks(years_arr)
    bottom.set_xticklabels([str(y) for y in years], rotation=45)

    plt.tight_layout()
    path = str(REPORTS_DIR / "breakpoint_figure_1.png")
    fig.savefig(path, dpi=150, bbox_inches="tight")
    plt.close(fig)
    logger.info("Saved Figure 1 to %s", path)
    return path


def create_figure_2(
    yearly_sum: dict[int, dict],
    opp_sum: dict[int, dict],
    mig_sum: dict[int, dict],
    non_mig_sum: dict[int, dict],
    ext_stratified: dict[str, dict[str, list]],
) -> str:
    """Figure 2: mean extremity over time (left) and bucketed pass rates (right).

    The left panel plots ``mean_extremity`` for four series; the right panel
    shows grouped bars of the pass rate per extremity bucket for the
    ``"pre-2024"`` and ``"post-2024"`` periods, each bar labelled with its N.
    An empty bucket is drawn as a zero-height bar.

    Returns:
        Path of the saved PNG (``breakpoint_figure_2.png`` in ``REPORTS_DIR``).
    """
    years = sorted(yearly_sum.keys())
    years_arr = np.array(years)

    def _vals(summary, key):
        return np.array([summary[y].get(key, np.nan) for y in years])

    fig, (ax_trend, ax_bars) = plt.subplots(1, 2, figsize=(14, 6))

    # Panel C: Mean extremity over time
    trend_series = [
        (yearly_sum, {"marker": "o", "color": "#002366", "linewidth": 2,
                      "label": "All right-wing", "zorder": 5}),
        (opp_sum, {"marker": "s", "color": "#E53935", "linewidth": 1.5,
                   "linestyle": "--", "label": "Opposition-only RW", "zorder": 4}),
        (mig_sum, {"marker": "^", "color": "#6A1B9A", "linewidth": 1.5,
                   "linestyle": ":", "label": "Migration", "zorder": 3}),
        (non_mig_sum, {"marker": "v", "color": "#4CAF50", "linewidth": 1.5,
                       "linestyle": "-.", "label": "Non-migration", "zorder": 2}),
    ]
    for summary, style in trend_series:
        ax_trend.plot(years_arr, _vals(summary, "mean_extremity"), **style)

    ax_trend.axvline(x=BREAK_YEAR - 0.5, color="black", linestyle=":", alpha=0.5, linewidth=1)
    upper = ax_trend.get_ylim()[1]
    label_y = upper * 0.95 if upper > 0 else 4.5
    ax_trend.annotate("2024", xy=(BREAK_YEAR - 0.3, label_y),
                      fontsize=9, color="black", alpha=0.7)

    ax_trend.set_xlabel("Year")
    ax_trend.set_ylabel("Mean Extremity Score")
    ax_trend.set_title("Content Extremity Over Time", fontweight="bold")
    ax_trend.legend(loc="upper left", fontsize=8)
    ax_trend.grid(True, alpha=0.3)
    ax_trend.set_xticks(years_arr)
    ax_trend.set_xticklabels([str(y) for y in years], rotation=45)

    # Panel D: Extremity-stratified pass rate (grouped bars)
    bucket_order = ["1-2 (mild)", "2-3 (moderate)", "3-4 (high)", "4-5 (extreme)"]
    bucket_labels = ["1-2\nmild", "2-3\nmoderate", "3-4\nhigh", "4-5\nextreme"]

    def _rates_and_counts(period):
        # Pass rate (0 for an empty bucket) and sample size per bucket.
        rates, counts = [], []
        for bucket in bucket_order:
            outcomes = ext_stratified[period].get(bucket, [])
            rates.append(np.mean(outcomes) if outcomes else 0)
            counts.append(len(outcomes))
        return rates, counts

    pre_rates, pre_ns = _rates_and_counts("pre-2024")
    post_rates, post_ns = _rates_and_counts("post-2024")

    x = np.arange(len(bucket_order))
    width = 0.35

    bars_pre = ax_bars.bar(x - width / 2, pre_rates, width, label="Pre-2024 (2016-2023)",
                           color="#90CAF9", edgecolor="black", alpha=0.9)
    bars_post = ax_bars.bar(x + width / 2, post_rates, width, label="Post-2024 (2024-2026)",
                            color="#1E88E5", edgecolor="black", alpha=0.9)

    # Sample-size label just above each bar (pre-period bars first).
    for bars, counts in ((bars_pre, pre_ns), (bars_post, post_ns)):
        for bar, n in zip(bars, counts):
            ax_bars.text(bar.get_x() + bar.get_width() / 2, bar.get_height() + 0.01,
                         f"N={n}", ha="center", va="bottom", fontsize=8, fontweight="bold")

    ax_bars.set_xticks(x)
    ax_bars.set_xticklabels(bucket_labels)
    ax_bars.set_ylabel("Pass Rate")
    ax_bars.set_title("Extremity-Stratified Pass Rate\nPre vs Post 2024", fontweight="bold")
    ax_bars.legend(fontsize=8)
    ax_bars.set_ylim(0, 1.05)
    ax_bars.grid(True, alpha=0.3, axis="y")

    plt.tight_layout()
    path = str(REPORTS_DIR / "breakpoint_figure_2.png")
    fig.savefig(path, dpi=150, bbox_inches="tight")
    plt.close(fig)
    logger.info("Saved Figure 2 to %s", path)
    return path


def generate_report(
    yearly_sum: dict[int, dict],
    opp_sum: dict[int, dict],
    mig_sum: dict[int, dict],
    non_mig_sum: dict[int, dict],
    baseline_sum: dict[int, dict],
    ext_stratified: dict[str, dict[str, list]],
    yearly_raw: dict[int, dict],
    opp_raw: dict[int, dict],
    fig1_path: str,
    fig2_path: str,
    audit_sample: list[dict],
    audit_notes: str = "",
) -> str:
    """Generate the breakpoint analysis markdown report."""
    years = sorted(yearly_sum.keys())

    def _val(summary, year, key):
        return summary[year].get(key, np.nan)

    # Pre/post 2024 comparisons
    pre_years = [y for y in years if y < BREAK_YEAR]
    post_years = [y for y in years if y >= BREAK_YEAR]

    # Pooled pre/post values for Cohen's d
    rw_pre_cs = []
    rw_post_cs = []
    rw_pre_pr = []
    rw_post_pr = []
    rw_pre_ext = []
    rw_post_ext = []

    opp_pre_cs = []
    opp_post_cs = []
    opp_pre_pr = []
    opp_post_pr = []
    opp_pre_ext = []
    opp_post_ext = []

    for y, d in yearly_raw.items():
        for idx in range(len(d.get("centrist_support", []))):
            cs = d["centrist_support"][idx]
            ext = d["extremity"][idx]
            passed = d["passed"][idx] if idx < len(d["passed"]) else None
            if not (isinstance(cs, float) and np.isnan(cs)):
                if y < BREAK_YEAR:
                    rw_pre_cs.append(cs)
                else:
                    rw_post_cs.append(cs)
            if not (isinstance(ext, float) and np.isnan(ext)):
                if y < BREAK_YEAR:
                    rw_pre_ext.append(ext)
                else:
                    rw_post_ext.append(ext)
            if passed is not None:
                if y < BREAK_YEAR:
                    rw_pre_pr.append(1.0 if passed else 0.0)
                else:
                    rw_post_pr.append(1.0 if passed else 0.0)

    for y, d in opp_raw.items():
        for idx in range(len(d.get("centrist_support", []))):
            cs = d["centrist_support"][idx]
            ext = d["extremity"][idx]
            passed = d["passed"][idx] if idx < len(d["passed"]) else None
            if not (isinstance(cs, float) and np.isnan(cs)):
                if y < BREAK_YEAR:
                    opp_pre_cs.append(cs)
                else:
                    opp_post_cs.append(cs)
            if not (isinstance(ext, float) and np.isnan(ext)):
                if y < BREAK_YEAR:
                    opp_pre_ext.append(ext)
                else:
                    opp_post_ext.append(ext)
            if passed is not None:
                if y < BREAK_YEAR:
                    opp_pre_pr.append(1.0 if passed else 0.0)
                else:
                    opp_post_pr.append(1.0 if passed else 0.0)

    d_cs = cohens_d(np.array(rw_pre_cs), np.array(rw_post_cs))
    d_pr = cohens_d(np.array(rw_pre_pr), np.array(rw_post_pr))
    d_ext = cohens_d(np.array(rw_pre_ext), np.array(rw_post_ext))

    d_opp_cs = cohens_d(np.array(opp_pre_cs), np.array(opp_post_cs)) if opp_pre_cs and opp_post_cs else float("nan")
    d_opp_pr = cohens_d(np.array(opp_pre_pr), np.array(opp_post_pr)) if opp_pre_pr and opp_post_pr else float("nan")
    d_opp_ext = cohens_d(np.array(opp_pre_ext), np.array(opp_post_ext)) if opp_pre_ext and opp_post_ext else float("nan")

    # Yearly summary table
    yearly_table = "| Year | N (RW) | Centrist Support | Pass Rate | Extremity | Right Support | Left Opp. |\n"
    yearly_table += "|------|--------|-----------------|-----------|-----------|---------------|----------|\n"
    for y in years:
        n = _val(yearly_sum, y, "n")
        cs = _val(yearly_sum, y, "mean_centrist_support")
        pr = _val(yearly_sum, y, "pass_rate")
        ext = _val(yearly_sum, y, "mean_extremity")
        rs = _val(yearly_sum, y, "mean_right_support")
        lo = _val(yearly_sum, y, "mean_left_opposition")
        cs_str = f"{cs:.3f}" if not np.isnan(cs) else "N/A"
        pr_str = f"{pr:.3f}" if not np.isnan(pr) else "N/A"
        ext_str = f"{ext:.2f}" if not np.isnan(ext) else "N/A"
        rs_str = f"{rs:.3f}" if not np.isnan(rs) else "N/A"
        lo_str = f"{lo:.3f}" if not np.isnan(lo) else "N/A"
        yearly_table += f"| {y} | {int(n)} | {cs_str} | {pr_str} | {ext_str} | {rs_str} | {lo_str} |\n"

    # Extremity-stratified table
    bucket_order = ["1-2 (mild)", "2-3 (moderate)", "3-4 (high)", "4-5 (extreme)"]
    ext_table = "| Bucket | Period | N | Pass Rate | Δ (post-pre) |\n"
    ext_table += "|--------|--------|---|-----------|-------------|\n"
    for b in bucket_order:
        pre_data = ext_stratified["pre-2024"].get(b, [])
        post_data = ext_stratified["post-2024"].get(b, [])
        pre_pr = np.mean(pre_data) if pre_data else float("nan")
        post_pr = np.mean(post_data) if post_data else float("nan")
        delta = post_pr - pre_pr if not np.isnan(pre_pr) and not np.isnan(post_pr) else float("nan")
        ext_table += f"| {b} | Pre-2024 | {len(pre_data)} | {pre_pr:.3f} | |\n"
        ext_table += f"| | Post-2024 | {len(post_data)} | {post_pr:.3f} | {delta:+.3f} |\n"

    # Audit table
    audit_table = "| # | Year | Category | LLM Score | Bucket | Agreed? | Driver |\n"
    audit_table += "|---|------|----------|-----------|--------|---------|--------|\n"
    for i, m in enumerate(audit_sample, 1):
        audit_table += f"| {i} | {m['year']} | {m['category']} | {m['extremity']} | {m['bucket']} | | |\n"

    lines = [
        "# Overton Window Breakpoint Analysis",
        "",
        "**Goal:** Quantify the 2024 structural break in centrist support, pass rates,",
        "and content extremity for right-wing motions in the Tweede Kamer.",
        "",
        "**Analysis period:** 2016–2026",
        "**Right-wing parties:** PVV, FVD, JA21, SGP",
        "**Centrist parties:** VVD, D66, CDA, NSC, BBB, CU",
        "**Left parties:** PvdA, GL, SP, PvdD, Volt, DENK, Bij1",
        "",
        "---",
        "",
        "## 1. Yearly Aggregate Metrics (All Right-Wing Motions)",
        "",
        yearly_table,
        "",
        "## 2. Pre/Post 2024 Comparison",
        "",
        f"**Break year:** {BREAK_YEAR}",
        "",
        "### All right-wing motions",
        "",
        f"| Metric | Pre-2024 Mean | Post-2024 Mean | Δ | Cohen's d |",
        f"|--------|--------------|---------------|-----|-----------|",
        f"| Centrist Support | {np.mean(rw_pre_cs):.3f} | {np.mean(rw_post_cs):.3f} | {np.mean(rw_post_cs) - np.mean(rw_pre_cs):+.3f} | {d_cs:+.2f} |",
        f"| Pass Rate | {np.mean(rw_pre_pr):.3f} | {np.mean(rw_post_pr):.3f} | {np.mean(rw_post_pr) - np.mean(rw_pre_pr):+.3f} | {d_pr:+.2f} |",
        f"| Extremity | {np.mean(rw_pre_ext):.2f} | {np.mean(rw_post_ext):.2f} | {np.mean(rw_post_ext) - np.mean(rw_pre_ext):+.2f} | {d_ext:+.2f} |",
        "",
        f"**Interpretation:** Cohen's d values quantify effect sizes (|d| < 0.2 small, 0.5 medium, > 0.8 large).",
        f"These are descriptive, not inferential — with only {len(pre_years)} pre-2024 years and {len(post_years)} post-2024 years, statistical significance is not claimed.",
        "",
        "### Opposition-only right-wing motions",
        "",
        f"| Metric | Pre-2024 Mean | Post-2024 Mean | Δ | Cohen's d | N pre / N post |",
        f"|--------|--------------|---------------|-----|-----------|---------------|",
        f"| Centrist Support | {np.mean(opp_pre_cs):.3f} | {np.mean(opp_post_cs):.3f} | {np.mean(opp_post_cs) - np.mean(opp_pre_cs):+.3f} | {d_opp_cs:+.2f} | {len(opp_pre_cs)} / {len(opp_post_cs)} |",
        f"| Pass Rate | {np.mean(opp_pre_pr):.3f} | {np.mean(opp_post_pr):.3f} | {np.mean(opp_post_pr) - np.mean(opp_pre_pr):+.3f} | {d_opp_pr:+.2f} | {len(opp_pre_pr)} / {len(opp_post_pr)} |",
        f"| Extremity | {np.mean(opp_pre_ext):.2f} | {np.mean(opp_post_ext):.2f} | {np.mean(opp_post_ext) - np.mean(opp_pre_ext):+.2f} | {d_opp_ext:+.2f} | {len(opp_pre_ext)} / {len(opp_post_ext)} |",
        "",
        "**Interpretation gate:** If opposition metrics also rise post-2024, the shift is not",
        "purely coalition-driven. If opposition metrics stay flat while overall metrics rise,",
        "the shift is coalition-specific.",
        "",
        "## 3. Coalition Composition",
        "",
        COALITION_NOTE,
        "",
        "Submitter party is parsed from motion title prefixes",
        "(e.g., \"Motie van het lid Wilders over ...\"). Only the lead submitter's party is",
        "considered. Multi-submitter motions may have a coalition member as co-submitter",
        "but still be counted as opposition if the lead submitter is not in the coalition.",
        "",
        "## 4. Domain Decomposition",
        "",
        "Migration = category `asiel/vreemdelingen`. Non-migration = all other categories.",
        "",
        "| Domain | Pre-2024 Mean CS | Post-2024 Mean CS | Δ CS | Pre-2024 PR | Post-2024 PR | Δ PR |",
        "|--------|-----------------|------------------|------|-------------|-------------|------|",
    ]

    for domain_name, domain_sum in [("Migration", mig_sum), ("Non-migration", non_mig_sum)]:
        pre_cs = np.nanmean([_val(domain_sum, y, "mean_centrist_support") for y in pre_years])
        post_cs = np.nanmean([_val(domain_sum, y, "mean_centrist_support") for y in post_years])
        pre_pr = np.nanmean([_val(domain_sum, y, "pass_rate") for y in pre_years])
        post_pr = np.nanmean([_val(domain_sum, y, "pass_rate") for y in post_years])
        lines.append(
            f"| {domain_name} | {pre_cs:.3f} | {post_cs:.3f} | {post_cs - pre_cs:+.3f} | "
            f"{pre_pr:.3f} | {post_pr:.3f} | {post_pr - pre_pr:+.3f} |"
        )

    lines += [
        "",
        "## 5. Extremity-Stratified Pass Rate",
        "",
        ext_table,
        "",
        "**Key test:** If high-extremity motions (3–5) went from low pass rate to high pass rate",
        "while mild motions stayed flat, centrists are more tolerant of extreme content —",
        "direct Overton shift evidence. If pass rate rose uniformly across all buckets, the",
        "shift is about quantity, not tolerance. If only the 1–2 bucket rose, right-wing",
        "parties filed milder motions post-2024 and the 'shift' is illusory.",
        "",
        "## 6. Manual Extremity Audit",
        "",
        audit_notes,
        "",
        audit_table,
        "",
        "## 7. Limitations",
        "",
        "- **Small-N time series:** 8 pre-2024 years and at most 3 post-2024 years (2026 is partial).",
        "   Effect sizes are descriptive, not confirmatory.",
        "- **LLM extremity scores:** Content-based, not independently validated beyond the",
        "   manual audit above. See §6 for agreement rate and noted biases.",
        "- **Coalition composition:** Hardcoded per year. 2024 is ambiguous (Rutte IV until July,",
        "   Schoof thereafter). Early 2024 motions may be miscoded as Schoof-era.",
        "- **Submitter party identification:** Parsed from motion title prefixes (e.g.,",
        "   'Motie van het lid X'). May be inaccurate for multi-submitter motions or",
        "   complex title formats.",
        "- **Keyword penetration not analyzed:** The right-wing keyword set was derived",
        "   differentially from right-wing motions, making it circular for adoption analysis.",
        "- **Pass rate baseline:** Computed across all motions with voting data. Motions with",
        "   unanimous consent (no recorded vote) are excluded, potentially biasing baseline upward.",
        "",
        "## 8. Figures",
        "",
        f"![Figure 1: Centrist Support and Pass Rate]({Path(fig1_path).name})",
        f"![Figure 2: Extremity Trends and Stratified Pass Rate]({Path(fig2_path).name})",
        "",
        "## 9. Conclusion",
        "",
        "*(Fill in after reviewing all indicators and audit results.)*",
    ]

    report_path = REPORTS_DIR / "breakpoint_analysis.md"
    with open(report_path, "w") as f:
        f.write("\n".join(lines))
    logger.info("Report written to %s", report_path)
    return str(report_path)


def main() -> int:
    """Run the breakpoint analysis end to end and return an exit status.

    The pipeline runs in this order:

    1. Open the motions database read-only and compute the raw per-year
       metrics (right-wing, baseline, opposition-only, domain split,
       extremity-stratified).
    2. Close the database connection; every later step works on the
       in-memory results only.
    3. Reduce the raw metrics with ``yearly_summary``.
    4. Create both figures, sample and print the manual-audit motions, and
       generate the markdown report.

    Returns:
        ``0`` on success. Errors are not caught here; they propagate to the
        caller as exceptions.
    """
    logger.info("Connecting to database: %s", DB_PATH)
    con = _conn(read_only=True)

    # Release the connection even when one of the compute steps raises, so a
    # failed run does not leave the database handle open.
    try:
        logger.info("Computing yearly right-wing metrics...")
        yearly_raw = compute_yearly_rw_metrics(con)

        logger.info("Computing baseline (all motions) metrics...")
        baseline_raw = compute_yearly_baseline(con)

        logger.info("Building party name map from mp_metadata...")
        name_party_map = build_party_name_map(con)

        # The remaining computations derive from yearly_raw and do not take
        # the connection as an argument.
        logger.info("Computing opposition-only metrics...")
        opp_raw = compute_opposition_metrics(yearly_raw, name_party_map)

        logger.info("Computing domain decomposition...")
        mig_raw, non_mig_raw = compute_domain_metrics(yearly_raw)

        logger.info("Computing extremity-stratified pass rates...")
        ext_stratified = compute_extremity_stratified(yearly_raw)
    finally:
        con.close()

    yearly_sum = yearly_summary(yearly_raw)
    opp_sum = yearly_summary(opp_raw)
    mig_sum = yearly_summary(mig_raw)
    non_mig_sum = yearly_summary(non_mig_raw)
    baseline_sum = yearly_summary(baseline_raw)

    logger.info("Generating Figure 1...")
    fig1_path = create_figure_1(yearly_sum, opp_sum, mig_sum, non_mig_sum, baseline_sum)

    logger.info("Generating Figure 2...")
    fig2_path = create_figure_2(yearly_sum, opp_sum, mig_sum, non_mig_sum, ext_stratified)

    logger.info("Sampling motions for manual audit...")
    audit_sample = sample_audit(yearly_raw)
    print_audit(audit_sample)

    logger.info("Generating report...")
    # Fixed instructions for the human reviewer; passed to generate_report
    # together with the sampled motions.
    audit_notes = (
        "**Audit notes:** Perform manual audit by reviewing the motions below. "
        "Record agreement per motion. Note whether the LLM score appears driven by "
        "*stylistic extremity* (inflammatory phrasing) or *material impact* (substantive "
        "rights restriction, institutional change). "
        "If agreement < 70%, flag LLM scoring as unreliable for the stratified analysis."
    )

    report_path = generate_report(
        yearly_sum=yearly_sum,
        opp_sum=opp_sum,
        mig_sum=mig_sum,
        non_mig_sum=non_mig_sum,
        baseline_sum=baseline_sum,
        ext_stratified=ext_stratified,
        yearly_raw=yearly_raw,
        opp_raw=opp_raw,
        fig1_path=fig1_path,
        fig2_path=fig2_path,
        audit_sample=audit_sample,
        audit_notes=audit_notes,
    )

    print(f"\nReport: {report_path}")
    print(f"Figure 1: {fig1_path}")
    print(f"Figure 2: {fig2_path}")
    return 0


# Script entry point: when executed directly (not imported), run main() and
# use its integer return value as the process exit status.
if __name__ == "__main__":
    raise SystemExit(main())