@albertbuchard
Created May 25, 2025 01:20
Entropy-Balanced IPAW: Efficient implementation of ridge-penalised entropy balancing applied to inverse probability of attrition weights (IPAW), ensuring finite, non-negative weights for longitudinal studies.
import numpy as np
import pandas as pd
import cvxpy as cp
from typing import Sequence, Union


def entropy_balance_ipaw(
    df: pd.DataFrame,
    *,
    baseline_covariates: Union[Sequence[str], None] = None,
    base_weight_col: str = "ipaw_true",
    session_col: str = "session",
    baseline_session: int = 1,
    ridge: float = 1e-3,          # L₂ penalty on imbalance
    out_col: str = "ipaw_ebal",
    solver: str = "ECOS",
) -> pd.DataFrame:
    """
    Ridge-penalised entropy balancing of existing IPAW weights.

    Guarantees finite, non-negative weights and never returns NaN.

    Objective (per session s ≠ baseline):

        minimise    Σ_i KL(w_i || w0_i) + ridge · || Zᵀ w − μ₀ Σ w0 ||²
        subject to  Σ_i w_i = Σ_i w0_i
                    w_i ≥ 1e-8 · mean(w0)   (numeric lower bound)
    """
    if baseline_covariates is None:
        baseline_covariates = ("age", "sex")
    df = df.copy()

    # baseline (session == baseline_session) covariate means
    mu0 = (
        df.loc[df[session_col] == baseline_session, list(baseline_covariates)]
        .mean()
        .to_numpy()
    )

    # index-aligned container, robust to non-default DataFrame indices
    new_w = pd.Series(np.nan, index=df.index, dtype=float)

    for s, g in df.groupby(session_col, sort=True):
        idx = g.index
        w0 = g[base_weight_col].to_numpy()

        # keep baseline weights unchanged
        if s == baseline_session:
            new_w.loc[idx] = w0
            continue

        Z = g[list(baseline_covariates)].to_numpy(float)
        n = len(w0)

        # numeric lower bound prevents under-flow when w0 is very small
        lb = 1e-8 * w0.mean()

        w = cp.Variable(n, nonneg=True)
        imbalance = Z.T @ w - mu0 * w0.sum()
        obj = cp.Minimize(
            cp.sum(cp.rel_entr(w, w0)) + ridge * cp.sum_squares(imbalance)
        )
        constraints = [cp.sum(w) == w0.sum(), w >= lb]
        prob = cp.Problem(obj, constraints)
        prob.solve(solver=solver, verbose=False)

        # ── graceful fall-backs ────────────────────────────────────────
        if prob.status not in ("optimal", "optimal_inaccurate") or w.value is None:
            new_w.loc[idx] = w0
            continue

        # OPTIONAL: rerun with exact equality when the ridge solution
        # already hits the balance constraints up to machine precision
        if imbalance.value is not None and np.linalg.norm(imbalance.value) < 1e-10:
            constraints_eq = [
                cp.sum(w) == w0.sum(),          # keep total mass fixed
                Z.T @ w == mu0 * w0.sum(),      # exact moment balance
                w >= lb,
            ]
            prob_eq = cp.Problem(cp.Minimize(cp.sum(cp.rel_entr(w, w0))), constraints_eq)
            prob_eq.solve(solver=solver, verbose=False)
            if (
                prob_eq.status in ("optimal", "optimal_inaccurate")
                and w.value is not None
            ):
                new_w.loc[idx] = w.value
                continue

        new_w.loc[idx] = w.value

    df[out_col] = new_w
    return df

Entropy-Balanced IPAW: Causal Considerations

This function, entropy_balance_ipaw, refines an existing set of Inverse Probability of Attrition Weights (IPAW) using ridge-penalized entropy balancing. While entropy balancing can improve covariate balance and produce numerically stable weights, its impact on the causal guarantees of IPAW (specifically, blocking backdoor paths between attrition and an outcome) depends crucially on how it's applied.

How IPAW Blocks Backdoor Paths

Standard IPAW aims to create a pseudo-population where confounders are balanced across different levels of "treatment" (i.e., remaining in the study versus attriting). The original weights ($w^{(0)}$, typically base_weight_col in this function) are derived from a model:

$w^{(0)}_{it} = 1 / \text{Pr}(\text{Subject } i \text{ remains at session } t \mid L_i)$ (or a stabilized version)

Here, $L$ represents the complete set of confounders that create backdoor paths between attrition and the outcome of interest. If $L$ is correctly and fully specified in this initial attrition model, and positivity holds, then weighting by $w^{(0)}$ ensures conditional exchangeability: the potential outcomes $Y(*)$ are independent of attrition $R$ given $L$. This blocks the backdoor paths.
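As a toy numeric illustration of the weight formula above (the retention probabilities here are invented, not estimated from any attrition model):

```python
import numpy as np

# Hypothetical retention probabilities Pr(subject i remains | L_i)
p_remain = np.array([0.9, 0.8, 0.5, 0.95, 0.7])

# Unstabilised IPAW: subjects unlikely to remain get up-weighted
w_unstab = 1.0 / p_remain

# Stabilised version: the numerator is the marginal retention
# probability, which pulls the weights toward 1 and reduces variance
p_marginal = p_remain.mean()
w_stab = p_marginal / p_remain
```

The subject with only a 50% retention probability counts twice under the unstabilised weights; stabilisation rescales all weights by the same marginal probability, leaving the pseudo-population balance intact while shrinking weight variance.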

Entropy Balancing and Causal Guarantees

The entropy_balance_ipaw function adjusts $w^{(0)}$ to new weights $w^{(*)}$ by minimizing the KL divergence from $w^{(0)}$ while enforcing (penalized) balance on a specified set of baseline_covariates.
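For intuition: with exact balance constraints, the KL minimisation has the well-known closed form $w^{(*)}_i \propto w^{(0)}_i \exp(\lambda^\top z_i)$, with $\lambda$ found by Newton's method on the dual. A minimal pure-NumPy sketch of that exact-balance special case (not the ridge-penalised problem the function above solves with cvxpy):

```python
import numpy as np

def entropy_balance_tilt(w0, Z, mu_target, n_iter=50):
    # Dual (exponential-tilting) form of exact entropy balancing:
    # w_i ∝ w0_i · exp(λᵀ z_i), with λ chosen so that the weighted mean
    # of each column of Z equals mu_target, and Σw = Σw0 is preserved.
    w0, Z = np.asarray(w0, float), np.asarray(Z, float)
    Zc = Z - mu_target                 # centre: target moments become zero
    lam = np.zeros(Z.shape[1])
    for _ in range(n_iter):
        u = w0 * np.exp(Zc @ lam)
        p = u / u.sum()                # normalised weights
        g = Zc.T @ p                   # residual imbalance (dual gradient)
        H = (Zc * p[:, None]).T @ Zc - np.outer(g, g)
        lam -= np.linalg.solve(H, g)   # Newton step on the dual
    return p * w0.sum()                # rescale to the original total mass

# Balance a single covariate 0..4 to a target mean of 2.5
w = entropy_balance_tilt(np.ones(5), np.arange(5.0).reshape(-1, 1), np.array([2.5]))
```

The cvxpy formulation in the function trades this exact solution for a ridge penalty, which remains well-posed when exact balance is infeasible or would force extreme weights.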

1. When Causal Protection is Preserved ("Guaranteed Safe")

The crucial insight is that if the entropy balancing procedure constrains or models exactly the same set of confounders $L$ (or a strict superset of $L$) that were used to generate the original $w^{(0)}$ weights, the backdoor path blocking property is preserved.

  • Mechanism: If $w^{(0)}$ correctly adjusted for $L$, and the entropy balancing adjustment $c(L_i)$ is purely a function of $L$ (i.e., baseline_covariates is identical to $L$), then the new weights $w^{(*)}_i = w^{(0)}_i \cdot c(L_i)$ still ensure that the potential outcomes $Y(*)$ are independent of attrition $R$ given $L$. The conditional exchangeability, once established by $w^{(0)}$ based on $L$, is not broken by a further re-weighting that is also solely based on $L$.
  • Practical Implication for this Function: To maintain causal guarantees, the baseline_covariates parameter in entropy_balance_ipaw must include all variables that were part of the original confounder set $L$ used to derive base_weight_col.
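One way to operationalise this requirement is a guard that refuses to proceed when baseline_covariates omits any member of the original confounder set. check_covers_confounders is a hypothetical helper, not part of the function above:

```python
def check_covers_confounders(baseline_covariates, confounders_L):
    # Raise if any confounder used to build the original IPAW model
    # is missing from the set being balanced on.
    missing = set(confounders_L) - set(baseline_covariates)
    if missing:
        raise ValueError(
            f"baseline_covariates omits original confounders: {sorted(missing)}"
        )

# A superset of L is fine; a subset should fail loudly.
check_covers_confounders(("age", "sex", "baseline_score"), ("age", "sex"))
```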

2. How Causal Protection Can Be Accidentally Compromised

Bias can be inadvertently re-introduced if care is not taken:

Scenario — why bias can creep back in:

  • Balance only on a subset $L_{\text{sub}} \subset L$: If baseline_covariates is only a subset of the original $L$, the calibration might improve balance on $L_{\text{sub}}$ but worsen it for the remaining confounders in $L \setminus L_{\text{sub}}$. Exchangeability based on the full $L$ is no longer guaranteed.
  • Add balancing constraints on variables $X \not\in L$:
    ✦ If $X$ is not a confounder: No new bias, but potentially increased variance.
    ✦ If $X$ is a hidden confounder (missed by the original $L$): This could be beneficial by effectively upgrading $L$.
    ✦ If aggressive re-weighting occurs for $X$: May violate positivity or inflate variance.
  • Use outcome or post-baseline variables in baseline_covariates: This directly breaks the backdoor block. The weights would now depend on variables affected by attrition or on the causal pathway to the outcome.
  • Original $w^{(0)}$ from a severely misspecified attrition model: If $L$ was incomplete in the first place, $w^{(0)}$ never fully blocked backdoor paths. Entropy balancing cannot fix this underlying omitted-variable bias; it might only redistribute existing bias.
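The variance-inflation risk noted above can be monitored with Kish's effective sample size, which drops sharply when a few observations dominate the weight mass (a generic diagnostic, not part of the function above):

```python
import numpy as np

def effective_sample_size(w):
    # Kish's ESS: (Σw)² / Σw² — shrinks as weights become more extreme
    w = np.asarray(w, dtype=float)
    return w.sum() ** 2 / np.sum(w ** 2)

# Aggressive re-weighting inflates variance: compare a uniform weight
# vector with a highly skewed one carrying the same total mass
ess_flat = effective_sample_size([1.0, 1.0, 1.0, 1.0])
ess_skew = effective_sample_size([3.7, 0.1, 0.1, 0.1])
```

A large drop in ESS after balancing is a sign that the constraints are forcing extreme weights, and that a stronger ridge penalty (or a smaller constraint set) may be warranted.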

3. Best Practices for Causal Safety with entropy_balance_ipaw

To leverage the benefits of entropy balancing (like improved empirical balance and numerical stability) without compromising causal inference:

  1. Define $L$ Broadly (for original IPAW): Ensure the model generating base_weight_col includes all plausible pre-attrition confounders ($L$).
  2. Diagnose Original Balance: Check the balance achieved by base_weight_col on all covariates in $L$.
  3. Use Full $L$ for Entropy Balancing: When calling entropy_balance_ipaw, set baseline_covariates to be identical to the full set $L$ used for base_weight_col. Do not omit covariates from this set, even if they appeared balanced by $w^{(0)}$, as the optimization could inadvertently disrupt their balance.
  4. Penalize (Ridge): The ridge parameter helps prevent extreme weights, especially with smaller sample sizes or when perfect balance is hard to achieve. This is generally safer than forcing exact balance.
  5. No Outcome/Post-Baseline Variables: Never include outcome data or variables affected by attrition (post-baseline stressors that are not part of $L$) in baseline_covariates.
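The balance diagnostics in step 2 (and a re-check after balancing) can use a standardised-mean-difference statistic. weighted_smd is a hypothetical helper comparing the weighted covariate mean against the baseline target:

```python
import numpy as np

def weighted_smd(x, w, mu0):
    # Difference between the weighted mean of covariate x and the
    # baseline target mu0, standardised by the weighted std. deviation
    x, w = np.asarray(x, float), np.asarray(w, float)
    mean = np.average(x, weights=w)
    sd = np.sqrt(np.average((x - mean) ** 2, weights=w))
    return (mean - mu0) / sd

# Perfectly balanced case: the weighted mean already equals the target
smd_zero = weighted_smd([1.0, 2.0, 3.0], [1.0, 1.0, 1.0], 2.0)

# Up-weighting the largest value pulls the mean above the target
smd_pos = weighted_smd([1.0, 2.0, 3.0], [1.0, 1.0, 4.0], 2.0)
```

A common rule of thumb is to flag covariates with an absolute standardised difference above roughly 0.1 as insufficiently balanced.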

Bottom Line for entropy_balance_ipaw

  • Causally Safe Use: When baseline_covariates in this function is set to the complete set of confounders $L$ that defined the original IPAW (base_weight_col), the resulting ipaw_ebal weights preserve the backdoor path blocking properties of the original IPAW. This function then serves to potentially improve model-robustness and variance control for the estimation of causal effects.
  • Risky Use: If baseline_covariates represents only a subset of $L$, or introduces variables inappropriately, the causal protection can be weakened or broken.

This function offers a powerful way to refine weights, but its application in a causal inference context requires careful consideration of the confounder set $L$.
