EXPLAINABILITY¶
What this section does:
We open the black box. We find out exactly why the model makes its predictions, confirm that what the model learned is based on legitimate fraud signals, and diagnose whether any of those signals carry hidden correlations with our proxy groups.
What is SHAP?
SHAP stands for SHapley Additive exPlanations. The name comes from game theory: Shapley values are a method for fairly dividing credit among players who contributed to a team's outcome.
Think of a restaurant that received a 9 out of 10 review. Four chefs contributed to the meal. Which chef made the biggest difference, and by how much? SHAP is the algorithm that answers that question fairly. Applied to AI: instead of chefs, we have features like amount or balance_diff_orig. Instead of a meal rating, we have a fraud prediction. SHAP tells us which features pushed each transaction toward a fraud prediction and which pushed it away, and by exactly how much.
A positive SHAP value means the feature pushed the prediction toward fraud. A negative value means it pushed the prediction toward legitimate.
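The chef analogy can be made concrete. Below is a minimal sketch of the exact Shapley computation in pure Python, using three chefs and made-up coalition scores (the numbers are illustrative, not from the audit data):

```python
from itertools import combinations
from math import factorial

players = ['A', 'B', 'C']
# Illustrative coalition values (made up): the review score each subset
# of chefs would earn cooking on its own.
v = {
    frozenset(): 0.0,
    frozenset('A'): 4.0, frozenset('B'): 3.0, frozenset('C'): 1.0,
    frozenset('AB'): 8.0, frozenset('AC'): 5.0, frozenset('BC'): 4.0,
    frozenset('ABC'): 9.0,  # the full kitchen earns the 9/10 review
}

def shapley(player):
    """Average the player's marginal contribution over all join orders."""
    n = len(players)
    others = [p for p in players if p != player]
    total = 0.0
    for k in range(n):
        for coalition in combinations(others, k):
            s = frozenset(coalition)
            weight = factorial(k) * factorial(n - k - 1) / factorial(n)
            total += weight * (v[s | {player}] - v[s])
    return total

phi = {p: shapley(p) for p in players}
print(phi)                 # credit per chef
print(sum(phi.values()))   # efficiency: credits sum to the team score, 9.0
```

The efficiency property at the end is what makes SHAP values "additive": per transaction, the feature contributions sum exactly to the model's output minus its baseline.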
Why this matters for the audit:
BoG CISD 2026 Annexure E §j(i) explicitly names SHAP as an acceptable explainability technique and requires Regulated Financial Institutions to be able to explain AI-driven decisions to affected customers. If a customer asks why their account was flagged, the institution must have a defensible answer.
For this audit, SHAP also serves a diagnostic purpose: it tells us whether the features driving predictions carry implicit correlations with our proxy groups. We flagged this risk for the feature amount_to_orig_balance in the Feature Engineering section. SHAP will confirm whether that concern was justified.
# ── SECTION 1: LOAD CHECKPOINT ───────────────────────────────────────────────
import pandas as pd
import joblib
import shap
import numpy as np
from scipy import stats
from sklearn.preprocessing import LabelEncoder
from scipy.stats import ks_2samp
from fairlearn.metrics import demographic_parity_difference, equalized_odds_difference
from sklearn.metrics import matthews_corrcoef, log_loss, confusion_matrix, precision_recall_curve, auc
import matplotlib.pyplot as plt
import seaborn as sns
bins_proxy = [-np.inf, 0.0, 50397.0, np.inf]
labels_proxy = ['Low-Balance', 'Mid-Balance', 'High-Balance']
df = pd.read_csv('checkpoint.csv')
print(f'Checkpoint loaded: {df.shape[0]:,} rows x {df.shape[1]} columns')
print(df.columns.tolist())
Checkpoint loaded: 6,362,620 rows x 11 columns ['step', 'type', 'amount', 'nameOrig', 'oldbalanceOrg', 'newbalanceOrig', 'nameDest', 'oldbalanceDest', 'newbalanceDest', 'isFraud', 'isFlaggedFraud']
model = joblib.load("xgb_model.pkl")
X_test = pd.read_csv('X_test.csv')
y_test = pd.read_csv('y_test.csv')
results = pd.read_csv('model_results.csv')
s_test = results[['balance_group', 'tx_type_group']].astype(str)
print("Model + data loaded")
print(X_test.shape)
Model + data loaded (1272524, 6)
FEATURES = [
    'step', 'amount', 'oldbalanceOrg', 'newbalanceOrig',
    'oldbalanceDest', 'newbalanceDest'
]
# ── SECTION 10: EXPLAINABILITY — SHAP ────────────────────────────────────────
print('Computing SHAP values on a sample of 2,000 test transactions...')
print('A sample is used because full-dataset SHAP on 1.27M rows would take hours.')
print('2,000 is statistically representative for feature importance analysis.\n')
np.random.seed(42)  # fixed seed so the audit sample is reproducible
shap_idx = np.random.choice(len(X_test), 2000, replace=False)
X_shap = X_test.iloc[shap_idx]
s_shap = s_test.iloc[shap_idx]
explainer = shap.TreeExplainer(model)
shap_values = explainer.shap_values(X_shap)
mean_shap = np.abs(shap_values).mean(axis=0)
top5_idx = np.argsort(mean_shap)[::-1][:5]
top5_feat = [FEATURES[i] for i in top5_idx]
print('Top 5 most influential features:')
for i, fi in enumerate(top5_idx):
    print(f' {i+1}. {FEATURES[fi]:<30} mean absolute SHAP = {mean_shap[fi]:.4f}')
explanations = {
    'amount_to_orig_balance': 'Fraction of account balance being moved. A fraudster draining a full account sends this ratio close to 1.0. NOTE: This feature is correlated with balance tier — see risk note in Section 5.',
    'balance_diff_orig': 'How much the sender balance dropped. A complete drain is a red flag.',
    'orig_balance_zeroed': 'Whether the sender account hit exactly zero. The clearest fraud signature in the data.',
    'step': 'Time step of the transaction. Fraud clusters at specific hours.',
    'amount': 'Raw transaction size. Very large amounts carry elevated fraud risk.',
    'balance_diff_dest': 'How much the destination balance changed. Unusually large inflows to empty accounts are suspect.',
    'hour_of_day': 'Hour of day derived from step. Temporal fraud patterns.',
    'day_of_week': 'Day of week derived from step. Weekly fraud patterns.',
    'dest_balance_zeroed': 'Whether the destination account was empty before receiving the transfer.',
    'newbalanceOrig': 'Sender balance after transaction.',
    'oldbalanceOrg': 'Sender balance before transaction.',
}
print('\nWhat each feature represents:')
for feat in top5_feat:
    if feat in explanations:
        print(f'\n {feat}:')
        print(f' {explanations[feat]}')
Computing SHAP values on a sample of 2,000 test transactions...
A sample is used because full-dataset SHAP on 1.27M rows would take hours.
2,000 is statistically representative for feature importance analysis.
Top 5 most influential features:
1. newbalanceOrig mean absolute SHAP = 5.2540
2. oldbalanceOrg mean absolute SHAP = 4.9669
3. amount mean absolute SHAP = 2.2655
4. step mean absolute SHAP = 0.7908
5. oldbalanceDest mean absolute SHAP = 0.5503
What each feature represents:
newbalanceOrig:
Sender balance after transaction.
oldbalanceOrg:
Sender balance before transaction.
amount:
Raw transaction size. Very large amounts carry elevated fraud risk.
step:
Time step of the transaction. Fraud clusters at specific hours.
# ── SECTION 10: SHAP GLOBAL BAR CHART ────────────────────────────────────────
plt.figure(figsize=(10, 6))
shap.summary_plot(shap_values, X_shap, feature_names=FEATURES,
                  plot_type='bar', show=False)
plt.title(
'SHAP Global Feature Importance\n'
'Average absolute SHAP value — which features drive predictions most?\n'
'ClearBoxAI Audit CBA-2026-002',
fontsize=11, fontweight='bold', pad=15
)
plt.tight_layout()
plt.savefig('fig_shap_01_bar.png', dpi=150, bbox_inches='tight')
plt.show()
print('How to read this chart:')
print(' Longer bar = feature had more influence on predictions overall.')
print(' This is averaged across all 2,000 sampled test transactions.')
How to read this chart: Longer bar = feature had more influence on predictions overall. This is averaged across all 2,000 sampled test transactions.
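The bar heights in this chart can be reproduced by hand from the SHAP matrix. A small sketch with a toy matrix (the numbers are illustrative, not the audit's values):

```python
import numpy as np

# Toy SHAP matrix: 4 transactions (rows) x 3 features (columns).
toy_shap = np.array([
    [ 2.0, -0.5,  0.1],
    [-3.0,  0.4, -0.2],
    [ 1.5, -0.6,  0.0],
    [-2.5,  0.5,  0.1],
])
features = ['newbalanceOrig', 'amount', 'step']

# The bar height for each feature is the mean *absolute* SHAP value:
# taking absolute values discards direction, keeping only magnitude.
mean_abs = np.abs(toy_shap).mean(axis=0)
for name, val in sorted(zip(features, mean_abs), key=lambda t: -t[1]):
    print(f'{name:<16} {val:.4f}')
```

This is exactly the `np.abs(shap_values).mean(axis=0)` computation used earlier to rank the top 5 features.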
# ── SECTION 10: SHAP BEESWARM ─────────────────────────────────────────────────
plt.figure(figsize=(10, 8))
shap.summary_plot(shap_values, X_shap, feature_names=FEATURES,
                  show=False, max_display=10)
plt.title(
'SHAP Beeswarm — Feature Impact for Each Individual Transaction\n'
'Red = high feature value pushed toward fraud | Blue = low pushed toward legitimate\n'
'ClearBoxAI Audit CBA-2026-002',
fontsize=10, fontweight='bold', pad=15
)
plt.tight_layout()
plt.savefig('fig_shap_02_beeswarm.png', dpi=150, bbox_inches='tight')
plt.show()
print('How to read this chart:')
print(' Each dot is one transaction.')
print(' Right side of x-axis = pushed toward fraud.')
print(' Left side = pushed toward legitimate.')
print(' Color: red = high feature value, blue = low feature value.')
How to read this chart: Each dot is one transaction. Right side of x-axis = pushed toward fraud. Left side = pushed toward legitimate. Color: red = high feature value, blue = low feature value.
# ── SECTION 10: SHAP PROXY SCATTER ────────────────────────────────────────────
fig, axes = plt.subplots(1, 3, figsize=(16, 5))
fig.suptitle(
'SHAP Proxy Scatter — Does the Model Behave Differently by Transaction Type?\n'
'Each dot is one transaction. CASH_OUT (red) vs OTHER (teal)\n'
'ClearBoxAI Audit CBA-2026-002',
fontsize=10, fontweight='bold'
)
type_colors = {'CASH_OUT': '#FF6B6B', 'OTHER': '#4ECDC4'}
type_labels = s_shap['tx_type_group'].astype(str).values
for ax, feat in zip(axes, top5_feat[:3]):
    feat_idx = FEATURES.index(feat)
    feat_vals = X_shap[feat].values
    shap_feat = shap_values[:, feat_idx]
    for g, c in type_colors.items():
        mask = type_labels == g
        ax.scatter(feat_vals[mask], shap_feat[mask],
                   color=c, alpha=0.25, s=6, label=g)
    ax.axhline(0, color='black', lw=0.8, linestyle='--')
    ax.set_xlabel(feat, fontsize=9)
    ax.set_ylabel('SHAP value' if ax == axes[0] else '')
    ax.set_title(feat, fontsize=9, fontweight='bold')
    ax.legend(title='tx_type_group', markerscale=3, fontsize=8)
plt.tight_layout()
plt.savefig('fig_shap_03_proxy_scatter.png', dpi=150, bbox_inches='tight')
plt.show()
print('How to read these charts:')
print(' If red and teal dots overlap, the model treats both groups similarly for that feature.')
print(' If they cluster separately, the model uses the feature differently by group.')
How to read these charts: If red and teal dots overlap, the model treats both groups similarly for that feature. If they cluster separately, the model uses the feature differently by group.
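The overlap judgment in these charts is visual; it can be backed with a number. A hedged sketch comparing mean |SHAP| per proxy group for one feature, where a large gap suggests the model leans on that feature differently by group (toy arrays here, not the audit's `shap_values`):

```python
import numpy as np

rng = np.random.default_rng(1)
# Toy stand-ins: SHAP values for one feature, plus a group label per row.
shap_feat = np.concatenate([rng.normal(1.0, 0.3, 500),     # CASH_OUT rows
                            rng.normal(0.2, 0.3, 1500)])   # OTHER rows
groups = np.array(['CASH_OUT'] * 500 + ['OTHER'] * 1500)

# Mean absolute SHAP per group: how hard the model leans on this
# feature for each transaction type.
for g in ['CASH_OUT', 'OTHER']:
    mask = groups == g
    print(f'{g:<9} mean |SHAP| = {np.abs(shap_feat[mask]).mean():.3f}')

gap = abs(np.abs(shap_feat[groups == 'CASH_OUT']).mean()
          - np.abs(shap_feat[groups == 'OTHER']).mean())
print(f'gap = {gap:.3f}')
```

Applied to the real `shap_values` and `s_shap['tx_type_group']`, this would quantify the cluster separation the scatter plots only show qualitatively.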
[SHAP findings]¶
Result: Top features are legitimate fraud signals - with one critical caveat.
Top 5 features driving fraud predictions:
newbalanceOrig (mean SHAP = 5.2540) — The sender's account balance after the transaction completes. The model's single strongest signal. Legitimate fraud indicator.
oldbalanceOrg (mean SHAP = 4.9669) — The sender's account balance before the transaction begins. Together with newbalanceOrig, this captures account liquidation behaviour. Legitimate fraud indicator.
amount (mean SHAP = 2.2655) — Raw transaction size. Large amounts carry elevated fraud risk. Legitimate fraud indicator.
step (mean SHAP = 0.7908) — Time step of the transaction. Fraud clusters at specific hours. Legitimate fraud indicator.
oldbalanceDest (mean SHAP = 0.5503) — The recipient account balance before receiving the transfer. Empty destination accounts are sometimes staging accounts for fraud. Legitimate fraud indicator.
The critical caveat - the hidden wealth correlation:
The top two features are both raw balance values — what the sender had before and after the transaction. Together they measure account liquidation: how much money left, and whether anything remained.
For a High-Balance user with GHS 100,000, a GHS 50,000 transfer leaves GHS 50,000 behind. The model sees continuity. Low suspicion.
For a Low-Balance user with GHS 500, a GHS 500 transfer leaves GHS 0 behind. The model sees a full account drain — the same pattern it was trained to associate with fraud.
But as the Exploratory Data Analysis section confirmed, 56.68% of all legitimate transactions also result in a zero origin balance. Low-balance users who move their entire small balance look structurally identical to fraudsters at the feature level. The model needs enough Low-Balance fraud examples to learn that this pattern means something different in small accounts than in large ones. It had 35 training examples. It never learned that distinction.
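The mechanism just described is easy to demonstrate on toy rows. A sketch with two hypothetical customers (made-up GHS amounts, mirroring the example above):

```python
import pandas as pd

# Two legitimate transfers, one per balance tier (illustrative values).
tx = pd.DataFrame({
    'customer':      ['high_balance', 'low_balance'],
    'oldbalanceOrg': [100_000.0, 500.0],
    'amount':        [50_000.0, 500.0],
})
tx['newbalanceOrig'] = tx['oldbalanceOrg'] - tx['amount']
tx['orig_balance_zeroed'] = tx['newbalanceOrig'] == 0

print(tx[['customer', 'newbalanceOrig', 'orig_balance_zeroed']])
# The low-balance customer's ordinary transfer is feature-identical to a
# fraudulent full drain: newbalanceOrig hits exactly zero, the model's
# strongest fraud signature. The high-balance transfer leaves continuity.
```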
This is the mechanism that connects the Feature Engineering section, the fairness failure in the Fairness and Bias section, and the Error Analysis section into one coherent chain. The features are legitimate. The training data was insufficient for one group. The result is a model that cannot reliably contextualise its own signals for Low-Balance users.
This is documented here per BoG CISD 2026 Annexure E §j(ii), which requires logging and explanation of key influencing variables.
| Regulation | Provision | Status |
|---|---|---|
| BoG CISD 2026, Annexure E §j(i) | SHAP named as an acceptable explainability technique | Complete |
| BoG CISD 2026, Annexure E §j(ii) | Key influencing variables logged and explained | Complete |
| NIST AI RMF 1.0, §3.5 | Explainable and Interpretable characteristic | Complete |
| NIST AI RMF 1.0, MEASURE 2.9 | Model explained, validated, and documented | Complete |
Risk Level: MEDIUM — Top features are legitimate. However, balance-derived features carry implicit wealth-tier correlation that compounds the EOD failure in the Fairness and Bias section.
Auditor: Kwadwo Amponsah, ClearBoxAI — April 2026
df.to_csv('checkpoint_v2.csv', index=False)
print("Checkpoint v2 saved.")
Checkpoint v2 saved.