import numpy as np
from numpy.random import default_rng
rng = default_rng(0)    # good practice for reproducibility

def gauss_sample(N, c, Sigma):
    """
    Draw N points from the multivariate Gaussian with mean c
    and covariance matrix Sigma.

    Standard-normal noise (taken from the module-level generator `rng`)
    is multiplied by the Cholesky factor of Sigma and shifted by c.
    The result holds one sample per column, i.e. it has len(c) rows
    and N columns.
    """
    dim = len(c)
    chol = np.linalg.cholesky(Sigma)      # factor with chol @ chol.T == Sigma
    noise = rng.normal(size=(dim, N))     # i.i.d. standard-normal entries
    return c[:, np.newaxis] + chol.dot(noise)

# Solution
import numpy as np

def my_cov(X):
    """
    Sample covariance matrix of the (real-valued) data matrix X.

    X has to be a genuinely 2D array with one variable per row and one
    observation per column. The estimate is normalised by N-1, where N
    is the number of columns.
    """
    _, n_obs = X.shape
    # subtract each row's mean so every variable is centred at zero
    centred = X - X.mean(axis=1, keepdims=True)
    scatter = centred.dot(centred.T)
    return scatter / (n_obs - 1)

# testing code: sample from a 2D Gaussian and estimate its covariance
N = 1000                           # number of samples to draw
c = np.array([4, -2])              # mean of the Gaussian
Sigma = np.array([[2, 0.5],
                  [0.5, 1]])       # covariance the estimate should approach
X = gauss_sample(N, c, Sigma)
cov_estimate = my_cov(X)
print('covariance matrix estimated from data:\n', cov_estimate)

# Note: this will only work for truly 2D NumPy arrays; 
# try my_cov(X[0,:]) to see it fail vs my_cov(X[0:1,:])

covariance matrix estimated from data:
 [[1.9100027  0.55528846]
 [0.55528846 1.0743857 ]]

# Solution
def gauss_density_2d(X0, X1, c, Sigma):
    """
    Evaluate the density of a 2D Gaussian with mean c and covariance
    matrix Sigma at the points (X0, X1).

    Parameters
    ----------
    X0, X1 : scalar or array-like
        First and second coordinates of the evaluation points (for
        example the two grids returned by np.meshgrid). They are
        combined elementwise, so they must broadcast against each other.
    c : array-like with two entries
        Mean of the Gaussian.
    Sigma : array-like, 2x2
        Covariance matrix.

    Returns
    -------
    Density values, one per (X0, X1) pair.

    Note: the inverse of Sigma is formed with the closed-form 2x2
    formula, which may fail for ill-conditioned Sigma.
    """
    # accept plain lists/tuples/scalars as well as NumPy arrays
    c = np.asarray(c, dtype=float)
    Sigma = np.asarray(Sigma, dtype=float)
    # get distance from c for each X0,X1 pair
    X0c = np.asarray(X0) - c[0]
    X1c = np.asarray(X1) - c[1]
    # matrix vector product inv(Sigma)*[X0c;X1c] using
    # formula for inverse of 2x2 matrix
    det = Sigma[0, 0]*Sigma[1, 1] - Sigma[1, 0]*Sigma[0, 1]  # det(Sigma)
    # build the adjugate as an explicit array rather than dividing a
    # nested list by a NumPy scalar
    Sigmainv = np.array([[Sigma[1, 1], -Sigma[0, 1]],
                         [-Sigma[1, 0], Sigma[0, 0]]]) / det
    SigmainvX0c = Sigmainv[0, 0]*X0c + Sigmainv[0, 1]*X1c
    SigmainvX1c = Sigmainv[1, 0]*X0c + Sigmainv[1, 1]*X1c
    # inner product of [X0c;X1c] with Sigmainv*[X0c;X1c]
    ip = X0c*SigmainvX0c + X1c*SigmainvX1c
    m = 2  # dimension of the Gaussian
    norm_const = 1 / (np.sqrt((2 * np.pi)**m * det))
    return norm_const * np.exp(-0.5 * ip)

import matplotlib.pyplot as plt
from time import perf_counter, time

# contour plot of Gaussian density function in 2d
x0 = np.linspace(-2, 10, 100)
x1 = np.linspace(-7, 3, 100)
X0, X1 = np.meshgrid(x0, x1)

# Time only the density evaluation (not the grid construction) and use
# perf_counter, whose resolution is fine enough for such a short call.
st = perf_counter()
Z1 = gauss_density_2d(X0, X1, c, Sigma)
print("evaluating Z took", perf_counter()-st, "seconds")

plt.contourf(X0, X1, Z1, levels=[0, 0.01, 0.05, 0.1, 0.2], cmap=plt.cm.Blues)
plt.colorbar()
plt.scatter(X[0,:], X[1,:], s=2, c='r')  # overlay the sampled points
plt.axis('tight')
plt.title('Gaussian density')
plt.show()

evaluating Z took 0.0 seconds

# We first need to copy over some functions and variables from the course notes.

# Gaussian parameters per class, keyed by the integer class label:
# c_[k] is the center and Sigma_[k] the covariance matrix of class k
c_ = {
    0: np.array([4, -2]),
    1: np.array([10, 3]),
    2: np.array([5, 4]),
}
Sigma_ = {
    0: np.array([[2, 0.5], [0.5, 1]]),
    1: np.array([[0.3, 0.2], [0.2, 0.8]]),
    2: np.array([[1, 0.5], [0.5, 1]]),
}

def multiple_classes(N, c_, Sigma_):
    """
    Generate N labelled samples of 2d data drawn from several classes.

    Class i (for i = 0, ..., len(c_)-1) is sampled with gauss_sample
    using center c_[i] and covariance Sigma_[i]. Each class receives
    N // len(c_) points; the last class additionally takes whatever is
    left so that the total is exactly N.

    Returns (X, y): X has one sample per column and y[n] is the class
    label (stored as a float) of column n. The columns are shuffled with
    the module-level generator `rng`.
    """
    nr_classes = len(c_)
    per_class = N // nr_classes
    # equal share for every class, the remainder goes to the last one
    counts = [per_class] * (nr_classes - 1)
    counts.append(N - (nr_classes - 1) * per_class)

    # start from empty 2-row / empty label arrays and collect class by class
    sample_parts = [np.zeros((2, 0))]
    label_parts = [np.zeros(0)]
    for label, count in enumerate(counts):
        sample_parts.append(gauss_sample(count, c_[label], Sigma_[label]))
        label_parts.append(label * np.ones(count))
    X = np.hstack(sample_parts)
    y = np.hstack(label_parts)

    # important: always shuffle the order of your data points
    order = rng.permutation(N)
    return X[:, order], y[order]

def h_coord_split(x):
    """
    Classify the point x by thresholding its coordinates.

    Returns 1 if x[0] > 8; otherwise 2 if x[1] > 1; otherwise 0.
    """
    if x[0] > 8:
        label = 1
    elif x[1] > 1:
        label = 2
    else:
        label = 0
    return label

def loss_01(y, yp):
    """0-1 loss: truthy when the label y and the prediction yp differ."""
    return y != yp

def empirical_err(h, loss, X, y):
    """
    Average loss of the hypothesis h over the labelled sample (X, y).

    The n-th data point is the column X[:,n] and y[n] is its label.
    For every point, loss(y[n], h(X[:,n])) is evaluated and the mean
    over all len(y) points is returned.
    """
    count = len(y)
    total = sum(loss(y[n], h(X[:, n])) for n in range(count))
    return total / count

# Convergence of the empirical error to the true generalisation error
# as the sample size N grows (the deviation is expected to shrink
# roughly like 1/sqrt(N))

limit = 0.00211238     # value used here as the true generalisation error
rng = default_rng(0)   # re-seed so the experiment is reproducible

# sample sizes: powers of ten from 10 up to 10^6
for N in [10, 100, 1000, 10000, 100000, 1000000]:
    Xnew, ynew = multiple_classes(N, c_, Sigma_)
    val = empirical_err(h_coord_split, loss_01, Xnew, ynew)
    # columns: sample size, empirical error, distance to the limit
    print(N, val, np.abs(val - limit))

10 0.0 0.00211238
100 0.0 0.00211238
1000 0.001 0.00111238
10000 0.0021 1.2380000000000203e-05
10000 0.0026 0.0004876199999999998
1000000 0.002096 1.6379999999999867e-05

Exercise 4.1

Exercise 4.2

Exercise 4.3

Exercise 4.4

Exercise 4.5

Exercise 4.6