Gaussian Generative Model¶
Structure
- Introduction
- The Math
- Problem Class
- Implementation — applied to the Iris dataset
- Results
- Limitations
1. Introduction¶
A Gaussian Generative Model classifies by asking: which class is most likely to have generated this data point? It models each class as a Gaussian (normal) distribution — a cloud of points centred at the class mean with a certain spread — and uses Bayes' rule to turn those distributions into a classifier.
Intuition: each class occupies a "cloud" in feature space. A new point falls somewhere in that space. The model asks: which cloud is this point most likely to have come from? The answer depends on how close the point is to each cloud's centre and how wide each cloud is.
Why generative? The model learns $P(x | y = c)$ — the probability of seeing a feature vector $x$ given class $c$. This is the generative direction: it describes how the data was generated. Classification then inverts this using Bayes' rule to compute $P(y = c | x)$.
Key advantage: by fitting a full distribution per class, the model can generate new synthetic examples and provides natural uncertainty estimates through the posterior probabilities.
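Because the model is a full distribution per class, sampling synthetic examples is a one-liner. A minimal sketch, using hypothetical (illustrative) parameter values rather than fitted ones:

```python
import numpy as np

rng = np.random.default_rng(0)

# Hypothetical fitted parameters for one class (illustrative values only)
mu = np.array([5.0, 3.4, 1.5, 0.2])   # class mean
sigma2 = 0.1                           # spherical variance

# Draw 5 synthetic feature vectors from the class Gaussian
synthetic = rng.normal(loc=mu, scale=np.sqrt(sigma2), size=(5, len(mu)))
print(synthetic.shape)  # (5, 4)
```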
2. The Math¶
Gaussian density¶
$$P(x|\mu, \sigma^2) = \frac{1}{(2\pi\sigma^2)^{d/2}} \exp\!\left(-\frac{1}{2\sigma^2}\|x - \mu\|^2\right)$$
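This is a spherical (isotropic) Gaussian: a single $\sigma^2$ shared across all $d$ dimensions. As a sanity check, the closed form can be compared against `scipy.stats.multivariate_normal` with covariance $\sigma^2 I$ (arbitrary example values below):

```python
import numpy as np
from scipy.stats import multivariate_normal

d = 3
mu = np.array([1.0, -2.0, 0.5])
sigma2 = 0.7
x = np.array([0.9, -1.5, 0.0])

# Closed-form spherical Gaussian density from the formula above
p = np.exp(-np.sum((x - mu)**2) / (2 * sigma2)) / (2 * np.pi * sigma2)**(d / 2)

# Same density via scipy with covariance sigma^2 * I
p_ref = multivariate_normal(mean=mu, cov=sigma2 * np.eye(d)).pdf(x)

print(np.isclose(p, p_ref))  # True
```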
MLE for parameters¶
Given class $c$ with $n_c$ examples:
$$\hat{\mu}^{(c)} = \frac{1}{n_c}\sum_{i: y^{(i)}=c} x^{(i)}$$ $$\hat{\sigma}^{2(c)} = \frac{1}{n_c \cdot d}\sum_{i: y^{(i)}=c} \|x^{(i)} - \hat{\mu}^{(c)}\|^2$$
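On a toy class of four 2-D points these estimators are easy to verify by hand; note that $\hat{\sigma}^{2(c)}$ pools squared deviations over all $n_c \cdot d$ entries into one scalar:

```python
import numpy as np

# Toy data: 4 points in 2-D, all belonging to one class c
Xc = np.array([[1.0, 2.0], [2.0, 4.0], [3.0, 0.0], [2.0, 2.0]])
n_c, d = Xc.shape

mu_hat = Xc.mean(axis=0)                            # per-feature class mean
sigma2_hat = ((Xc - mu_hat)**2).sum() / (n_c * d)   # single pooled variance

print(mu_hat)       # [2. 2.]
print(sigma2_hat)   # 10 / 8 = 1.25
```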
Classification via posterior¶
$$\hat{y} = \arg\max_c \left[\log P(x|\hat{\mu}^{(c)}, \hat{\sigma}^{2(c)}) + \log P(y=c)\right]$$
The log-posterior is: $$\log P(y=c|x) \propto -\frac{d}{2}\log(2\pi\hat{\sigma}^{2(c)}) - \frac{\|x-\hat{\mu}^{(c)}\|^2}{2\hat{\sigma}^{2(c)}} + \log P(y=c)$$
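The argmax only needs these unnormalised log scores, but normalising them (via the log-sum-exp trick for numerical stability) recovers actual posterior probabilities. A sketch with two hypothetical classes:

```python
import numpy as np

def log_posterior_unnorm(x, mu, sigma2, log_prior):
    # Unnormalised log posterior: log-likelihood + log prior
    d = len(x)
    return (-0.5 * d * np.log(2 * np.pi * sigma2)
            - np.sum((x - mu)**2) / (2 * sigma2) + log_prior)

# Two hypothetical classes (illustrative parameters)
params = [
    (np.array([0.0, 0.0]), 1.0, np.log(0.5)),
    (np.array([3.0, 3.0]), 1.0, np.log(0.5)),
]
x = np.array([0.5, 0.2])

scores = np.array([log_posterior_unnorm(x, m, s2, lp) for m, s2, lp in params])
# Normalise in log space (subtract the max before exponentiating)
post = np.exp(scores - scores.max())
post /= post.sum()
print(post)  # heavily favours class 0, which is much closer to x
```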
import numpy as np
import matplotlib.pyplot as plt
from matplotlib.patches import Ellipse

fig, axes = plt.subplots(1, 2, figsize=(13, 4))
rng = np.random.default_rng(5)
means = [[-2, 0], [2, 2], [1, -2]]
covs = [[[1, 0.5], [0.5, 1]], [[0.8, 0], [0, 0.8]], [[1.2, -0.3], [-0.3, 0.6]]]
cols = ['steelblue', 'tomato', 'seagreen']

# ── Diagram 1: Gaussian clouds ────────────────────────────────────────────────
ax = axes[0]
for mu, cov, col in zip(means, covs, cols):
    pts = rng.multivariate_normal(mu, cov, 60)
    ax.scatter(pts[:, 0], pts[:, 1], c=col, edgecolors='k', s=20, alpha=0.5)
    ax.scatter(*mu, c=col, marker='+', s=200, linewidths=3, zorder=5)
    vals, vecs = np.linalg.eigh(cov)                    # eigenvalues in ascending order
    angle = np.degrees(np.arctan2(*vecs[:, 1][::-1]))   # orientation of the major axis
    for nsig in [1, 2]:
        # width follows the major axis (largest eigenvalue), height the minor
        e = Ellipse(mu, 2*nsig*np.sqrt(vals[1]), 2*nsig*np.sqrt(vals[0]),
                    angle=angle, fill=False, color=col, lw=1.5, alpha=0.8)
        ax.add_patch(e)
ax.set_title('Each class modelled as a Gaussian cloud (ellipses = 1σ, 2σ contours)',
             fontsize=10, fontweight='bold')
ax.set_aspect('equal'); ax.grid(True, linestyle='--', alpha=0.4)

# ── Diagram 2: Bayes rule for classification ──────────────────────────────────
ax = axes[1]
ax.axis('off')
lines = [
    ('Bayes Rule for Classification', True),
    ('', False),
    ('P(y=c | x) ∝ P(x | y=c) × P(y=c)', False),
    ('', False),
    ('posterior ∝ likelihood × prior', False),
    ('', False),
    ('Step 1: Fit a Gaussian to each class → get μ, σ²', False),
    ('Step 2: Compute P(x | class) for new point x', False),
    ('Step 3: Multiply by prior P(class)', False),
    ('Step 4: Pick the class with highest posterior', False),
]
for k, (line, bold) in enumerate(lines):
    ax.text(0.05, 0.95 - k*0.09, line, transform=ax.transAxes,
            fontsize=11 if bold else 10, fontweight='bold' if bold else 'normal',
            va='top', color='navy' if bold else 'black')
plt.suptitle('Figure 1 — Gaussian Generative Model', fontsize=13, y=1.02)
plt.tight_layout(); plt.show()
3. Problem Class¶
Gaussian generative models are well-suited for:
- Classification when features are approximately Gaussian within each class
- Problems where you need posterior probabilities, not just hard labels
- Small datasets — the model has few parameters ($\mu$ and $\sigma^2$ per class) so it doesn't overfit easily
- Multi-class problems — extends naturally by fitting one Gaussian per class
Not well-suited for:
- Features with heavy tails or multimodal distributions within a class
- Categorical or count features — the Gaussian assumption is inappropriate (use a multinomial or Bernoulli Naive Bayes instead)
- High-dimensional data where estimating the full covariance matrix is unstable
4. Implementation¶
Dataset: Iris¶
150 iris flower samples, 4 measurements (sepal/petal length and width), 3 species. A classic benchmark for classification — species form compact, roughly Gaussian clusters in feature space.
Source: sklearn.datasets.load_iris
%matplotlib inline
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import confusion_matrix
data = load_iris()
X_raw, y = data.data, data.target
X_train_raw, X_test_raw, y_train, y_test = train_test_split(X_raw, y, test_size=0.2, random_state=42, stratify=y)
scaler = StandardScaler()
X_train = scaler.fit_transform(X_train_raw)
X_test = scaler.transform(X_test_raw)
X = np.vstack([X_train, X_test]) # full standardised set (used only for axis ranges)
print(f'Train: {X_train.shape[0]} Test: {X_test.shape[0]}')
print(f'Classes: {data.target_names}')
print(f'Features: {data.feature_names}')
Train: 120 Test: 30
Classes: ['setosa' 'versicolor' 'virginica']
Features: ['sepal length (cm)', 'sepal width (cm)', 'petal length (cm)', 'petal width (cm)']
Observation
120 training samples, 30 test samples from the Iris dataset. Three balanced classes: setosa, versicolor, virginica. Four features: sepal length, sepal width, petal length, petal width. The equal class sizes mean the fitted prior for each class is simply 1/3.
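The balanced-priors claim is easy to verify. A self-contained check that re-creates the split above and computes the empirical class frequencies:

```python
import numpy as np
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split

X_raw, y = load_iris(return_X_y=True)
X_tr, X_te, y_tr, y_te = train_test_split(
    X_raw, y, test_size=0.2, random_state=42, stratify=y)

# Stratified split keeps the classes balanced, so each fitted prior is 1/3
priors = np.bincount(y_tr) / len(y_tr)
print(priors)  # [0.3333... 0.3333... 0.3333...]
```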
4.1 Explore Class Distributions¶
palette = ['steelblue', 'tomato', 'seagreen']
fig, axes = plt.subplots(2, 2, figsize=(12, 8))
for ax, feat_idx, fname in zip(axes.flatten(), range(4), data.feature_names):
    for i, (col, name) in enumerate(zip(palette, data.target_names)):
        vals = X_train[y_train == i, feat_idx]
        mu, sigma = vals.mean(), vals.std()
        ax.hist(vals, bins=15, alpha=0.4, color=col, density=True, label=name)
        x_range = np.linspace(vals.min()-0.5, vals.max()+0.5, 100)
        ax.plot(x_range, np.exp(-0.5*((x_range-mu)/sigma)**2)/(sigma*np.sqrt(2*np.pi)),
                c=col, lw=2)
    ax.set_title(fname, fontsize=10, fontweight='bold')
    ax.set_ylabel('Density')
    ax.legend(fontsize=8)
    ax.grid(True, linestyle='--', alpha=0.4)
plt.suptitle('Feature Distributions per Class — with fitted Gaussians', fontsize=12, y=1.01)
plt.tight_layout(); plt.show()
Observation — Feature distributions
The per-feature histograms show setosa clearly separated on the petal dimensions: its standardised petal-length mean is −1.30, vs +0.27 (versicolor) and +1.03 (virginica). Sepal features overlap much more across classes. This tells us the model will classify setosa confidently but will struggle to separate versicolor from virginica in sepal space.
4.2 Fit Gaussian Generative Model¶
def fit_gaussian(X, y):
    classes = np.unique(y)
    params = {}
    for c in classes:
        Xc = X[y == c]
        mu = Xc.mean(axis=0)              # per-feature class mean
        sigma2 = ((Xc - mu)**2).mean()    # single spherical variance per class
        prior = (y == c).mean()
        params[c] = {'mu': mu, 'sigma2': sigma2, 'log_prior': np.log(prior)}
    return params

def log_gaussian(x, mu, sigma2):
    d = len(x)
    return -0.5*d*np.log(2*np.pi*sigma2) - np.sum((x - mu)**2)/(2*sigma2)

def predict_gaussian(X, params):
    preds = []
    for x in X:
        scores = {c: log_gaussian(x, p['mu'], p['sigma2']) + p['log_prior']
                  for c, p in params.items()}
        preds.append(max(scores, key=scores.get))
    return np.array(preds)
params = fit_gaussian(X_train, y_train)
y_pred_train = predict_gaussian(X_train, params)
y_pred_test = predict_gaussian(X_test, params)
print(f'Train accuracy: {(y_pred_train == y_train).mean():.2%}')
print(f'Test accuracy:  {(y_pred_test == y_test).mean():.2%}')
print()
for c, p in params.items():
print(f'Class {data.target_names[c]}: mu={np.round(p["mu"],2)}, sigma2={p["sigma2"]:.4f}')
Train accuracy: 85.00%
Test accuracy: 83.33%

Class setosa: mu=[-1.02  0.82 -1.3  -1.25], sigma2=0.2353
Class versicolor: mu=[ 0.11 -0.67  0.27  0.15], sigma2=0.2258
Class virginica: mu=[ 0.92 -0.15  1.03  1.1 ], sigma2=0.3727
Observation — Model fit
Test accuracy 83.33% (25/30 correct). Setosa is perfectly separable: its class Gaussian sits far from the other two (standardised petal-length mean −1.30 vs +0.27/+1.03). Most errors occur between versicolor and virginica, whose feature means are closer and whose fitted variances overlap (σ² 0.2258 vs 0.3727). The shared-variance assumption (one σ² per class, averaged across all 4 features) flattens the decision boundary and causes some misclassification at the versicolor/virginica border.
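One natural relaxation of the shared-variance assumption is a diagonal (per-feature) variance per class. A minimal sketch of that variant; `fit_diag` and `log_gaussian_diag` are assumed helper names, not part of the model code above, and the data here is synthetic:

```python
import numpy as np

def fit_diag(X, y):
    # Per-feature variance instead of a single shared sigma^2 per class
    params = {}
    for c in np.unique(y):
        Xc = X[y == c]
        params[c] = {'mu': Xc.mean(axis=0),
                     'sigma2': Xc.var(axis=0),   # one variance per feature
                     'log_prior': np.log((y == c).mean())}
    return params

def log_gaussian_diag(x, mu, sigma2):
    # Sum of independent 1-D Gaussian log-densities
    return np.sum(-0.5 * np.log(2 * np.pi * sigma2) - (x - mu)**2 / (2 * sigma2))

# Tiny synthetic check: two well-separated classes with unequal feature spreads
rng = np.random.default_rng(0)
X = np.vstack([rng.normal([0, 0], [1, 0.1], (50, 2)),
               rng.normal([4, 4], [1, 0.1], (50, 2))])
y = np.repeat([0, 1], 50)

p = fit_diag(X, y)
s0 = log_gaussian_diag(X[0], p[0]['mu'], p[0]['sigma2']) + p[0]['log_prior']
s1 = log_gaussian_diag(X[0], p[1]['mu'], p[1]['sigma2']) + p[1]['log_prior']
print(s0 > s1)  # True: a class-0 point scores higher under class 0
```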
4.3 Confusion Matrix & Decision Regions¶
fig, axes = plt.subplots(1, 2, figsize=(13, 5))
cm = confusion_matrix(y_test, y_pred_test)
sns.heatmap(cm, annot=True, fmt='d', cmap='Blues',
            xticklabels=data.target_names, yticklabels=data.target_names,
            ax=axes[0], linewidths=0.5)
axes[0].set_title('Confusion Matrix (Test Set)', fontsize=11, fontweight='bold')
axes[0].set_ylabel('Actual'); axes[0].set_xlabel('Predicted')

ax = axes[1]
f1, f2 = 0, 2  # sepal length vs petal length
x_min, x_max = X[:, f1].min()-0.5, X[:, f1].max()+0.5
y_min, y_max = X[:, f2].min()-0.5, X[:, f2].max()+0.5
xx, yy = np.meshgrid(np.linspace(x_min, x_max, 150), np.linspace(y_min, y_max, 150))
grid = np.zeros((xx.size, 4))
grid[:, f1] = xx.ravel(); grid[:, f2] = yy.ravel()
zz = predict_gaussian(grid, params).reshape(xx.shape)
ax.contourf(xx, yy, zz, levels=[-0.5, 0.5, 1.5, 2.5],
            colors=['#d4e8f5', '#f5d4d4', '#d4f5d4'], alpha=0.5)
ax.contour(xx, yy, zz, levels=[0.5, 1.5], colors='gray', linewidths=1)
for i, (col, name) in enumerate(zip(palette, data.target_names)):
    m = y_test == i
    ax.scatter(X_test[m, f1], X_test[m, f2], c=col, edgecolors='k', s=60, label=name, zorder=3)
ax.set_xlabel(data.feature_names[f1]); ax.set_ylabel(data.feature_names[f2])
ax.set_title('Decision Regions (sepal length vs petal length)', fontsize=11, fontweight='bold')
ax.legend(fontsize=9); ax.grid(True, linestyle='--', alpha=0.3)
plt.tight_layout(); plt.show()
Observation — Decision regions
The 2D decision-boundary plot (using the two most discriminative features) shows a clean, nearly linear boundary between setosa and the others, and a curved boundary between versicolor and virginica. Because each class has its own variance, the boundaries are quadratic; with a full covariance matrix per class this would be Quadratic Discriminant Analysis (QDA), of which our spherical model is a special case.
5. Results¶
| Class | Test accuracy |
|---|---|
| Setosa | 100% |
| Versicolor | ~73% |
| Virginica | ~73% |
| Overall | 83.33% |
The Gaussian generative model achieves 83.33% test accuracy on Iris. Setosa is perfectly classified: its petal dimensions form a clearly separable Gaussian. The ~17% error rate comes almost entirely from the versicolor/virginica boundary, where the two class Gaussians overlap in sepal space. Fitting per-class covariance matrices (rather than a single spherical variance per class) would tighten the boundary and likely improve accuracy.
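The full-covariance variant is readily available in scikit-learn. A self-contained sketch that reproduces the same split and fits `QuadraticDiscriminantAnalysis` for comparison (the exact accuracy will depend on the split, so it is not stated here):

```python
import numpy as np
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.discriminant_analysis import QuadraticDiscriminantAnalysis

X_raw, y = load_iris(return_X_y=True)
X_tr, X_te, y_tr, y_te = train_test_split(
    X_raw, y, test_size=0.2, random_state=42, stratify=y)
scaler = StandardScaler()
X_tr, X_te = scaler.fit_transform(X_tr), scaler.transform(X_te)

# Full per-class covariance matrices: quadratic decision boundaries
qda = QuadraticDiscriminantAnalysis().fit(X_tr, y_tr)
print(f'QDA test accuracy: {qda.score(X_te, y_te):.2%}')
```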
6. Limitations¶
- Spherical Gaussian assumption: this implementation uses a single variance $\sigma^2$ per class for all features and all directions, which assumes all features are equally spread and uncorrelated. Fitting a full covariance matrix per class (Quadratic Discriminant Analysis) or a shared full covariance across classes (Linear Discriminant Analysis) removes this limitation
- Gaussian may not fit: if a class has bimodal or skewed features, a single Gaussian is a poor fit — the model will misclassify examples in the tails
- Shared variance: forcing a single $\sigma^2$ per class (rather than per feature) is a strong simplification; different features often have very different spreads
- Sensitivity to outliers in training: the MLE for $\mu$ and $\sigma^2$ is affected by outliers, which can shift the fitted cloud
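The outlier sensitivity is easy to demonstrate on a 1-D toy example: a single extreme value shifts the MLE mean substantially and inflates the variance, while a robust statistic such as the median barely moves.

```python
import numpy as np

clean = np.array([1.0, 1.2, 0.9, 1.1, 1.0])
with_outlier = np.append(clean, 10.0)   # one extreme training point

# MLE mean jumps from 1.04 to ~2.53; variance is inflated even more
print(clean.mean(), with_outlier.mean())
print(clean.var(), with_outlier.var())

# The median (a robust alternative) barely moves: 1.0 -> 1.05
print(np.median(clean), np.median(with_outlier))
```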