AUTODIAL · zhechengyin · Jun 19, 2025 · Jul 17, 2025 · Jul 22, 2025 · Jul 22, 2025
diff --git a/examples/basic_workflow.ipynb b/examples/basic_workflow.ipynb
diff --git a/examples/helper_function/evaluate_posterior_distribution.py b/examples/helper_function/evaluate_posterior_distribution.py
@@ -0,0 +1,146 @@
+import os
+import math
+import numpy as np
+import matplotlib.pyplot as plt
+from scipy.stats import probplot, gaussian_kde
+from sklearn.linear_model import LinearRegression
+
+
+# ---------- Peak-finding helpers ----------
+def suppress_close_peaks(idx_sorted, window):
+    kept = []
+    for i in idx_sorted:
+        if all(abs(i - j) >= window for j in kept):
+            kept.append(i)
+    return sorted(kept)
+
+
+def detect_peaks(x, y, alpha=6e-5, height_ratio=0.5, tol=1e-3, debug=False):
+    """Return (indices, coords) of peaks that satisfy height + consensus."""
-def detect_peaks(x, y, alpha=6e-5, height_ratio=0.5, tol=1e-3, debug=False):
-    """Return (indices, coords) of peaks that satisfy height + consensus."""
+def detect_peaks(x, y, alpha=DEFAULT_ALPHA, height_ratio=0.5, tol=1e-3, debug=False):
+    """
+    Return (indices, coords) of peaks that satisfy height + consensus.
+    
+    Parameters:
+        x (array-like): The x-coordinates of the data points.
+        y (array-like): The y-coordinates of the data points.
+        alpha (float): Threshold scaling factor for peak detection. Default is 6e-5.
+        height_ratio (float): Minimum height ratio for peak filtering. Default is 0.5.
+        tol (float): Tolerance for consensus voting. Default is 1e-3.
+        debug (bool): If True, prints debug information. Default is False.
+    
+    Returns:
+        tuple: Indices and coordinates of detected peaks.
+    """
-def detect_peaks(x, y, alpha=6e-5, height_ratio=0.5, tol=1e-3, debug=False):
-    """Return (indices, coords) of peaks that satisfy height + consensus."""
+def detect_peaks(x, y, alpha=DEFAULT_ALPHA, height_ratio=0.5, tol=1e-3, debug=False):
+    """
+    Return (indices, coords) of peaks that satisfy height + consensus.
+    
+    Parameters:
+        x (array-like): The x-coordinates of the data points.
+        y (array-like): The y-coordinates of the data points.
+        alpha (float): Threshold scaling factor for peak detection. Default is 6e-5.
+        height_ratio (float): Minimum height ratio for peak filtering. Default is 0.5.
+        tol (float): Tolerance for consensus voting. Default is 1e-3.
+        debug (bool): If True, prints debug information. Default is False.
+    
+    Returns:
+        tuple: Indices and coordinates of detected peaks.
+    """
+    def apply_method(method):
+        if method == "range":
+            thr = alpha * (y.max() - y.min())
+        elif method == "std":
+            thr = alpha * y.std()
+        elif method == "iqr":
+            q1, q3 = np.percentile(y, [25, 75])
+            thr = alpha * (q3 - q1)
+        else:
+            raise ValueError
+        peaks = [
+            (i, x[i], y[i])
+            for i in range(1, len(y) - 1)
+            if y[i] > y[i - 1] and y[i] > y[i + 1] and y[i] - min(y[i - 1], y[i + 1]) > thr
+        ]
+        return peaks
+
+    methods = ["range", "std", "iqr"]
+    peak_sets = [set(apply_method(m)) for m in methods]
+
+    # ── consensus voting (≥2 methods) ─────────────────────────
+    consensus = {
+        (idx, px, py)
+        for idx, px, py in peak_sets[0]
+        if sum(any(abs(px - px2) < tol for _, px2, _ in s) for s in peak_sets) >= 2
+    }
+
+    # ── height filter ─────────────────────────────────────────
+    y_max = y.max()
+    height_thr = height_ratio * y_max
+    cand = [(idx, px, py) for idx, px, py in consensus if py >= height_thr]
+    if debug:
+        for _, px, py in cand:
+            print(f"  peak@{px:.4g}  height={py:.4g}  thr={height_thr:.4g}")
+
+    if not cand:
+        return [], []
+
+    # ── non-max suppression ───────────────────────────────────
+    dx = np.median(np.diff(np.sort(x)))
+    bw = 1.06 * y.std() * len(x) ** (-1 / 5)
+    window_pts = round((0.4 * bw) / dx)  # Same formula originally used
+    idx_sorted = [idx for idx, *_ in sorted(cand, key=lambda p: p[2], reverse=True)]
+    idx_keep = suppress_close_peaks(idx_sorted, window_pts)
+
+    peaks_coord = [(float(x[i]), float(y[i])) for i in idx_keep]
+    return idx_keep, peaks_coord
+
+
+def skewness(sample):
+    m2 = np.mean((sample - sample.mean()) ** 2)
+    m3 = np.mean((sample - sample.mean()) ** 3)
+    return 0.0 if m2 == 0 else round(m3 / m2 ** 1.5, 4)
+
+
+# ---------- main ----------
+def evaluate_posterior_distribution(
+    mcmc,
+    threshold=79,
+    save_plot=False,
+    save_dir="figures",
+    height_ratio=0.5,
+    debug=False,
+):
+    def score_one(sample):
+        (t, q), _ = probplot(sample, dist="norm")
+        r2 = LinearRegression().fit(t[:, None], q[:, None]).score(t[:, None], q[:, None])
+        sk = skewness(sample)
+
+        x = np.linspace(sample.min(), sample.max(), 600)  # finer grid
+        y = gaussian_kde(sample)(x)
+        idx, coords = detect_peaks(x, y, height_ratio=height_ratio, debug=debug)
+        modes = len(idx)
+    # Constants for scoring formula
+    R2_WEIGHT = 100  # Weight for R² (goodness of fit)
+    SKEWNESS_PENALTY = 5  # Penalty for absolute skewness
+    MODES_PENALTY = 9  # Penalty for the number of modes
+
+        score = r2 * R2_WEIGHT - abs(sk) * SKEWNESS_PENALTY - modes * MODES_PENALTY
+        return max(0, round(score, 2)), r2, sk, modes, x, y, coords
+
+    def save_plot_func(label, sample, x, y, peaks, skew, score, r2, cat1, cat2):
+        os.makedirs(os.path.join(save_dir, cat1, cat2), exist_ok=True)
+        plt.figure(figsize=(8, 6))
+        plt.subplot(2, 1, 1)
+        plt.plot(x, y, label="KDE")
+        if peaks:
+            px, py = zip(*peaks)
+            plt.scatter(px, py, color="red", s=80, marker="x")
+        plt.title(f"{label} KDE | Score:{score} | R²:{r2:.3f} | Skew:{skew:.3f}")
+        plt.legend()
+        plt.subplot(2, 1, 2)
+        plt.hist(sample, bins=30, edgecolor="black")
+        plt.tight_layout()
+        plt.savefig(os.path.join(save_dir, cat1, cat2, f"{label}-{score}.png"))
+        plt.close()
+
+    total_score, bad_params = 0, []
+
+    for name, chain in mcmc.get_samples().items():
+        if name in ("lp__", "log_likelihood"):
+            continue
+
+        sample = np.asarray(chain)
+        score, r2, sk, modes, x, y, peaks = score_one(sample)
+        total_score += score
+        if score < threshold:
+            bad_params.append(name)
+
+        if save_plot:
+            if math.isnan(sk):
+                cat1 = "Invalid"
+            elif abs(sk) >= 2:
+                cat1 = "Touch-Bound"
+            elif modes > 1:
+                cat1 = "Multi-Peak"
+            elif sk < -0.5:
+                cat1 = "Right-Skewed"
+            elif sk > 0.5:
+                cat1 = "Left-Skewed"
+            else:
+                cat1 = "Normal"
+            cat2 = "Good" if score >= threshold else "Bad"
+            save_plot_func(name, sample, x, y, peaks, sk, score, r2, cat1, cat2)
+
+
+    return total_score, bad_params
diff --git a/examples/helper_function/update_circuits_info.py b/examples/helper_function/update_circuits_info.py
@@ -0,0 +1,85 @@
+import numpy as np
+import autoeis as ae
+
+def update_circuits_with_posterior_scores(
+    circuits_df,
+    results,
+    freq,
+    Z,
+    score_fn,
+    threshold=79,
+    save_plot=True,
+    verbose=True
+):
+    """
+    Integrate posterior quality evaluation into circuits DataFrame.
+
+    Args:
+        circuits_df (pd.DataFrame): Original circuits table.
+        results (list): List of AutoEIS InferenceResult.
+        freq (np.ndarray): Frequency array.
+        Z (np.ndarray): Impedance data.
+        score_fn (callable): Your posterior scoring function, should return (total_score, bad_param_list).
+        threshold (int): Score threshold for bad parameter filtering.
+        save_plot (bool): Whether to generate KDE/histogram plots.
+        verbose (bool): Whether to print per-circuit result.
+
+    Returns:
+        pd.DataFrame: Updated circuits DataFrame.
+    """
+    scores = []
+    bad_params_all = []
+
+    if verbose:
+        print("Evaluating posterior distributions...\n")
+
+    for result in results:
+        if result.converged:
+            if verbose:
+                ae.visualization.print_summary_statistics(result.mcmc, result.circuit)
+
+            total_score, bad_params = score_fn(
+                result.mcmc, threshold=threshold, save_plot=save_plot
+            )
+
+            if verbose:
+                print(f"Circuit: {result.circuit}")
+                print(f"Score: {total_score:.2f}")
+                print(f"Bad parameters: {bad_params if bad_params else 'None'}\n")
+        else:
+            total_score, bad_params = 0, ["Not Converged"]
+            if verbose:
+                print(f"Circuit {result.circuit} did not converge.\n")
+
+        scores.append(total_score)
+        bad_params_all.append(", ".join(bad_params) if bad_params else "None")
+
+    # ---------- Write inference results to new DataFrame columns ----------
+    circuits_df = circuits_df.copy()
+    circuits_df["InferenceResult"] = results
+    circuits_df["Posterior Score"] = scores
+    circuits_df["Bad Parameters"] = bad_params_all
+
+    # ---------- Compute fitness metrics using AutoEIS ----------
+    circuits_df = ae.core.compute_fitness_metrics(circuits_df, freq, Z)
+
+    # ---------- Custom ranking logic ----------
+    # True if the circuit contains bad parameters, False otherwise
+    circuits_df["HasBad"] = circuits_df["Bad Parameters"].str.strip().str.lower() != "none"
+
+    # Sort so that circuits without bad parameters come first,
+    # and within each group, sort by Posterior Score (descending)
+    circuits_df.sort_values(
+        by=["HasBad", "Posterior Score"],
+        ascending=[True, False],
+        inplace=True,
+        ignore_index=True
+    )
+
+    # Assign consecutive ranks: 1, 2, 3, ...
+    circuits_df["Posterior Score Rank"] = np.arange(1, len(circuits_df) + 1)
+
+    # Optional: Remove the helper column
+    circuits_df.drop(columns=["HasBad"], inplace=True)
+
+    return circuits_df
diff --git a/src/autoeis/visualization.py b/src/autoeis/visualization.py
@@ -416,30 +416,37 @@ def print_inference_results(circuits: pd.DataFrame, return_table=True) -> Styler
     # Add columns to the table
     columns = [
         "Circuit",
-        "WAIC (real)" if "WAIC (real)" in circuits.columns else "WAIC (mag)",
-        "WAIC (imag)" if "WAIC (imag)" in circuits.columns else "WAIC (phase)",
+        "WAIC (mag)" if "WAIC (mag)" in circuits.columns else "WAIC (real)",
+        "WAIC (phase)" if "WAIC (phase)" in circuits.columns else "WAIC (imag)",
         "R2 (re)",
         "R2 (im)",
         "MAPE (re)",
         "MAPE (im)",
         "Np",
+        "Posterior Score",
+        "Posterior Score Rank",
+        "Bad Parameters",
     ]
+
     for column in columns:
         table.add_column(column, justify="right")
 
     # Fill the table with data
     for i, row in df.data.iterrows():
         table.add_row(
             row["circuitstring"],
-            f"{row['WAIC (real)' if 'WAIC (real)' in circuits.columns else 'WAIC (mag)']:.2e}",
-            f"{row['WAIC (imag)' if 'WAIC (imag)' in circuits.columns else 'WAIC (phase)']:.2e}",
+            f"{row['WAIC (mag)' if 'WAIC (mag)' in circuits.columns else 'WAIC (real)']:.2e}",
+            f"{row['WAIC (phase)' if 'WAIC (phase)' in circuits.columns else 'WAIC (imag)']:.2e}",
             f"{row['R^2 (ravg)']:.3f}",
             f"{row['R^2 (iavg)']:.3f}",
             f"{row['MAPE (ravg)']:.2e}",
             f"{row['MAPE (iavg)']:.2e}",
             f"{row['n_params']}",
+            f"{row['Posterior Score']:.2f}",
+            str(row['Posterior Score Rank']),
+            row['Bad Parameters'],
         )
-
+        
     return table if return_table else df