E2 236 Foundations of ML¶

Lab 4a: Kernel Methods¶

Part A — Dual Representation, RBF & Gaussian Kernels¶

Topics covered:

  • Dual representation of linear models
  • Radial Basis Function (RBF) / Gaussian kernel
  • Kernel ridge regression on synthetic data
  • Kernel SVM classification on synthetic data
  • Visualising decision boundaries and regression fits

Instructions: Fill in all sections marked # YOUR CODE HERE. Do not modify the test assertions.


0. Setup & Imports¶

In [4]:
import numpy as np
import matplotlib.pyplot as plt
from matplotlib.colors import ListedColormap
from sklearn.datasets import make_moons, make_circles, make_classification
from sklearn.preprocessing import StandardScaler
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score, mean_squared_error


np.random.seed(42)
%matplotlib inline
plt.rcParams.update({'figure.dpi': 110, 'font.size': 11})

1. Kernel Functions¶

The Gaussian / RBF kernel between two vectors $\mathbf{x}$ and $\mathbf{x}'$ is defined as

$$k(\mathbf{x}, \mathbf{x}') = \exp\!\left(-\frac{\|\mathbf{x} - \mathbf{x}'\|^2}{2\ell^2}\right)$$

where $\ell > 0$ is the length-scale (bandwidth) hyperparameter.

The polynomial kernel of degree $d$ is

$$k(\mathbf{x}, \mathbf{x}') = (\mathbf{x}^\top \mathbf{x}' + c)^d$$
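Before filling in the stubs below, it may help to see one common vectorized pattern. The sketch that follows is only an illustration (functions are suffixed `_ref` so they don't collide with the stubs you must implement yourself); it uses the expansion $\|\mathbf{a}-\mathbf{b}\|^2 = \|\mathbf{a}\|^2 + \|\mathbf{b}\|^2 - 2\,\mathbf{a}^\top\mathbf{b}$ to avoid explicit loops:

```python
import numpy as np

def rbf_kernel_ref(X1, X2, length_scale=1.0):
    # Pairwise squared distances via ||a-b||^2 = ||a||^2 + ||b||^2 - 2 a.b
    sq = (np.sum(X1**2, axis=1)[:, None]
          + np.sum(X2**2, axis=1)[None, :]
          - 2.0 * X1 @ X2.T)
    np.maximum(sq, 0.0, out=sq)  # guard against tiny negative values from round-off
    return np.exp(-sq / (2.0 * length_scale**2))

def polynomial_kernel_ref(X1, X2, degree=3, c=1.0):
    # (x^T x' + c)^d, computed for all pairs at once
    return (X1 @ X2.T + c) ** degree
```

The broadcasting trick computes all $n \times m$ distances in one pass, which matters once you build Gram matrices on hundreds of points.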

In [2]:
def rbf_kernel(X1, X2, length_scale=1.0):
    """
    Compute the RBF (Gaussian) kernel matrix between rows of X1 and X2.

    Parameters
    ----------
    X1 : ndarray of shape (n, d)
    X2 : ndarray of shape (m, d)
    length_scale : float

    Returns
    -------
    K : ndarray of shape (n, m)
    """
    # YOUR CODE HERE
    raise NotImplementedError


def polynomial_kernel(X1, X2, degree=3, c=1.0):
    """
    Compute the polynomial kernel matrix.

    Parameters
    ----------
    X1 : ndarray of shape (n, d)
    X2 : ndarray of shape (m, d)
    degree : int
    c : float — free parameter

    Returns
    -------
    K : ndarray of shape (n, m)
    """
    # YOUR CODE HERE
    raise NotImplementedError
In [6]:
# --- Quick sanity checks (do not modify) ---
X_test = np.array([[1.0, 0.0], [0.0, 1.0]])
K_rbf = rbf_kernel(X_test, X_test, length_scale=1.0)
assert K_rbf.shape == (2, 2), "Shape error"
assert np.allclose(np.diag(K_rbf), 1.0), "Diagonal should be 1 for RBF"
K_poly = polynomial_kernel(X_test, X_test, degree=2, c=1.0)
assert K_poly.shape == (2, 2)
print("Kernel sanity checks passed ✓")
Kernel sanity checks passed ✓

2. Visualising the Kernel Matrix¶

Plot the RBF kernel matrix for a 1-D grid of 100 points in $[-3, 3]$ for three different length-scales: $\ell \in \{0.3, 1.0, 3.0\}$.

Hint: Use plt.imshow or plt.pcolormesh.
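One possible layout is sketched below. So that it runs standalone, the sketch computes the 1-D kernel matrix inline by broadcasting rather than calling your `rbf_kernel`; in your own solution you should call your implementation instead:

```python
import numpy as np
import matplotlib.pyplot as plt

x = np.linspace(-3, 3, 100)[:, None]
fig, axes = plt.subplots(1, 3, figsize=(12, 4))
for ax, ell in zip(axes, [0.3, 1.0, 3.0]):
    # For 1-D inputs, broadcasting (x - x.T) gives all pairwise differences
    K = np.exp(-(x - x.T) ** 2 / (2 * ell ** 2))
    ax.imshow(K, extent=(-3, 3, -3, 3), origin="lower", cmap="viridis")
    ax.set_title(f"$\\ell = {ell}$")
fig.tight_layout()
```

Notice how larger length-scales produce a wider band of near-1 entries around the diagonal: distant points become more correlated.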

In [ ]:
# YOUR CODE HERE
# For each length_scale, compute the kernel matrix on a 1-D grid and plot it.
# Use a 1×3 subplot layout.

3. Kernel Ridge Regression — Dual Representation¶

Given training data $(\mathbf{X}, \mathbf{y})$, kernel ridge regression finds the dual coefficients

$$\boldsymbol{\alpha} = (\mathbf{K} + \lambda \mathbf{I})^{-1} \mathbf{y}$$

and predictions are made via

$$\hat{y}(\mathbf{x}_*) = \sum_{i=1}^{n} \alpha_i\, k(\mathbf{x}_i, \mathbf{x}_*)$$

Q3.1 — Generate 80 noisy samples of $y = \sin(2x) + \varepsilon$, $\varepsilon \sim \mathcal{N}(0, 0.1^2)$, $x \in [-\pi, \pi]$.
Q3.2 — Implement fit and predict for kernel ridge regression.
Q3.3 — Fit models with $\ell \in \{0.3, 1.0, 3.0\}$ and plot the results.
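For orientation, the two equations above map to just a few lines of linear algebra. The throwaway sketch below (all names local to it; the kernel, $\ell = 0.5$, and $\lambda = 10^{-3}$ are arbitrary choices, not the values your solution must use) shows the fit/predict pattern you will wrap into the class below:

```python
import numpy as np

rng = np.random.default_rng(0)
X = rng.uniform(-np.pi, np.pi, size=(80, 1))
y = np.sin(2 * X[:, 0]) + rng.normal(0.0, 0.1, size=80)

def rbf(X1, X2, ell=0.5):
    # Pairwise squared distances via broadcasting
    sq = np.sum((X1[:, None, :] - X2[None, :, :]) ** 2, axis=-1)
    return np.exp(-sq / (2 * ell ** 2))

lam = 1e-3
K = rbf(X, X)
alpha = np.linalg.solve(K + lam * np.eye(len(X)), y)  # solve (K + λI)α = y

X_star = np.linspace(-np.pi, np.pi, 200)[:, None]
y_pred = rbf(X_star, X) @ alpha                       # ŷ(x*) = Σ_i α_i k(x_i, x*)
```

Prefer `np.linalg.solve` over explicitly inverting $\mathbf{K} + \lambda\mathbf{I}$: it is cheaper and numerically better behaved.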

In [ ]:
# Q3.1 — Generate data
# YOUR CODE HERE
# X_train shape: (80, 1), y_train shape: (80,)
In [ ]:
class KernelRidgeRegression:
    """Kernel Ridge Regression via the dual representation."""

    def __init__(self, kernel_fn, lam=1e-3):
        """
        Parameters
        ----------
        kernel_fn : callable  k(X1, X2) -> matrix
        lam       : float     regularisation strength λ
        """
        self.kernel_fn = kernel_fn
        self.lam = lam
        self.alpha_ = None
        self.X_train_ = None

    def fit(self, X, y):
        """
        Solve (K + λI)α = y and store α and X.

        Parameters
        ----------
        X : ndarray (n, d)
        y : ndarray (n,)
        """
        # YOUR CODE HERE
        raise NotImplementedError

    def predict(self, X_star):
        """
        Predict at new inputs X_star.

        Parameters
        ----------
        X_star : ndarray (m, d)

        Returns
        -------
        y_pred : ndarray (m,)
        """
        # YOUR CODE HERE
        raise NotImplementedError
In [ ]:
# Q3.3 — Fit and plot for three length-scales
# YOUR CODE HERE


4. Effect of Length-Scale and Regularisation¶

Q4.1 — Using your KernelRidgeRegression class, perform a grid search over $\ell \in \{0.1, 0.3, 1.0, 3.0\}$ and $\lambda \in \{10^{-4}, 10^{-2}, 1\}$. Report the test MSE for each combination (use an 80/20 train/test split).

Q4.2 — Plot a heatmap of the test MSE grid.

Q4.3 (written) — In 2–3 sentences, explain the effect of increasing $\ell$ and increasing $\lambda$ on the model's bias and variance.

In [ ]:
# Q4.1 & Q4.2 — Grid search + heatmap
# YOUR CODE HERE

Q4.3 — Written answer:

[Your answer here]

5. Kernel SVM Classification¶

We now apply the kernel trick to classification using a Support Vector Machine with an RBF kernel.

Q5.1 — Generate two 2-D datasets:

  • make_moons(n_samples=300, noise=0.2)
  • make_circles(n_samples=300, noise=0.15, factor=0.5)

Q5.2 — Fit sklearn.svm.SVC with kernel='rbf' on each dataset.
Q5.3 — Plot the decision boundary and support vectors for each dataset.
Q5.4 (written) — What happens to the decision boundary when you set C very large or very small?
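As a starting point, the basic fit-and-score pattern with `sklearn.svm.SVC` is sketched below. The hyperparameters `C=1.0` and `gamma="scale"` are just the library defaults, not tuned values, and the seed is arbitrary:

```python
from sklearn.datasets import make_moons
from sklearn.model_selection import train_test_split
from sklearn.svm import SVC

X, y = make_moons(n_samples=300, noise=0.2, random_state=0)
X_tr, X_te, y_tr, y_te = train_test_split(X, y, test_size=0.2, random_state=0)

clf = SVC(kernel="rbf", C=1.0, gamma="scale").fit(X_tr, y_tr)
acc = clf.score(X_te, y_te)
# The fitted support vectors are exposed as clf.support_vectors_ (shape (n_sv, 2)),
# which is what you will overlay on the decision-boundary plot in Q5.3.
```

For Q5.4, vary `C` over several orders of magnitude and watch how the number of support vectors and the boundary smoothness change.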

In [ ]:
from sklearn.svm import SVC

def plot_decision_boundary(clf, X, y, ax, title=''):
    """Plot a 2-class decision boundary on ax."""
    # YOUR CODE HERE — build a meshgrid, predict, and plot contourf + scatter
    pass

# Q5.1 Generate data
# YOUR CODE HERE

# Q5.2 Fit SVMs
# YOUR CODE HERE

# Q5.3 Plot
fig, axes = plt.subplots(1, 2, figsize=(12, 4))
# YOUR CODE HERE
plt.tight_layout()
plt.show()

Q5.4 — Written answer:

[Your answer here]

6. Comparing Kernels on a Nonlinear Dataset¶

Q6.1 — Use make_moons(n_samples=500, noise=0.3) with an 80/20 split.
Q6.2 — Train an SVC with each of the following kernels: 'linear', 'poly' (degree 3), 'rbf'.
Q6.3 — Report accuracy and plot all three decision boundaries side by side.
Q6.4 (written) — Rank the kernels by test accuracy and explain why the best kernel performs well on this dataset.

In [ ]:
# Q6.1–6.3 — Compare kernels
# YOUR CODE HERE

Q6.4 — Written answer:

[Your answer here]

7. The Kernel Matrix is Positive Semi-Definite (Conceptual)¶

Q7 (written) — Prove (or give an intuitive argument) that the Gram matrix $K_{ij} = k(\mathbf{x}_i, \mathbf{x}_j)$ constructed with the RBF kernel is always positive semi-definite.
Hint: Consider the feature map $\phi$ such that $k(\mathbf{x}, \mathbf{x}') = \phi(\mathbf{x})^\top \phi(\mathbf{x}')$.
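A numerical check is not a proof, but it can build confidence before you write the argument. The sketch below builds an RBF Gram matrix on random points (with $\ell = 1$, an arbitrary choice) and confirms its eigenvalues are non-negative up to floating-point tolerance:

```python
import numpy as np

rng = np.random.default_rng(0)
X = rng.normal(size=(30, 2))

# RBF Gram matrix with length-scale 1
sq = np.sum((X[:, None, :] - X[None, :, :]) ** 2, axis=-1)
K = np.exp(-sq / 2.0)

# K is symmetric, so eigvalsh returns real eigenvalues
eigvals = np.linalg.eigvalsh(K)
# PSD means every eigenvalue is >= 0 (up to round-off)
```

Your written answer should explain *why* this holds for any point set, via the feature map in the hint: $\mathbf{v}^\top K \mathbf{v} = \|\sum_i v_i\, \phi(\mathbf{x}_i)\|^2 \ge 0$.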

Q7 — Written answer:

[Your answer here]


End of Part A¶

Proceed to Part B: Gaussian Processes.