import os
import numpy as np
from scipy.io import loadmat
import matplotlib.pyplot as plt
from matplotlib.lines import Line2D
from math import pi
mat = loadmat(os.path.join("data", "data_class4.mat"))
data = mat["Data"][0]
C = data.shape[0]
C
4
D = data[0].shape[0]
D
2
N = np.zeros(C)
for c in range(C):
    N[c] = data[c].shape[1]
print("N", N)
N [400. 400. 600. 400.]
data[0].shape
(2, 400)
means = []
for c in range(C):
    mu = np.mean(data[c], axis=1)
    means.append(mu)
    print(f"mu {c} = {mu}")
means = np.array(means)
mu 0 = [9.93166666 5.04771704]
mu 1 = [ 6.89476702 -3.06678779]
mu 2 = [-1.96618141 -2.05252646]
mu 3 = [-1.85830966 2.96492564]
Note: NumPy normalizes the variance according to the delta degrees of freedom (ddof) parameter; np.var defaults to ddof=0, which gives the population variance. To compute the unbiased sample variance (division by $N-1$), ddof must be set to 1.
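For illustration, a minimal sketch using the already loaded data[0] (class 1), showing how ddof changes the normalization from $N$ to $N - \text{ddof}$:

x = data[0][0]                    # first feature of class 1
n = x.shape[0]
biased = np.var(x)                # ddof=0: divides by n (population variance)
sample = np.var(x, ddof=1)        # ddof=1: divides by n - 1 (sample variance)
manual = np.sum((x - x.mean())**2) / (n - 1)
print(np.isclose(sample, manual))                 # True
print(np.isclose(biased, sample * (n - 1) / n))   # True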
# numpy's built-in function for computing covariance matrix
np_covariances = []
for c in range(C):
    cov = np.cov(data[c], ddof=1)
    np_covariances.append(cov)
    # print(f"covariance {c} \n {cov}")
np_covariances = np.array(np_covariances)
# my function for computing covariance matrix (without optimization)
covariances = np.zeros((C, D, D))
for c in range(C):
    for i in range(D):
        for j in range(D):
            cov = np.sum((data[c][i] - means[c][i]) * (data[c][j] - means[c][j])) / (N[c] - 1.)
            covariances[c, i, j] = cov
            # print(f"covariance {c} {i} {j} = {cov}")
print("covariances\n", covariances)
covariances
 [[[ 2.92878667  1.34060751]
   [ 1.34060751  4.14604723]]

  [[ 1.90650611  1.2951869 ]
   [ 1.2951869   2.03553604]]

  [[ 6.69513194  1.01051255]
   [ 1.01051255  1.17354871]]

  [[ 1.90363212 -0.53673905]
   [-0.53673905  0.66481358]]]
# sanity check: the last variance computed above matches the direct formula
np.isclose(np.sum((data[c][i] - means[c][i])**2) / (N[c] - 1.), covariances[c, i, i])
True
def compute_eigenvalues(A):
    a = 1
    b = -(A[0, 0] + A[1, 1])
    c = (A[0, 0] * A[1, 1]) - (A[1, 0] * A[0, 1])

    def solve_quadratic(a, b, c):
        term1 = np.sqrt((b**2) - (4 * a * c))
        denom = 2 * a
        ans1 = (-b - term1) / denom
        ans2 = (-b + term1) / denom
        return ans1, ans2

    return solve_quadratic(a, b, c)
eigenvalues, eigenvectors = [], []
for c in range(C):
    val, vec = np.linalg.eig(covariances[c])
    eigenvalues.append(val)
    eigenvectors.append(vec)
    # eigenvalues.append(compute_eigenvalues(covariances[c]))
eigenvalues = np.array(eigenvalues)
eigenvectors = np.array(eigenvectors)
eigenvalues
array([[2.06511966, 5.00971424],
       [0.67422839, 3.26781376],
       [6.87425631, 0.99442435],
       [2.10383047, 0.46461523]])
fig = plt.figure(figsize=(18, 4))
for cc in range(C):
    ax = fig.add_subplot(140 + cc + 1)
    # eigenvectors are the columns of the matrix returned by np.linalg.eig
    ax.plot([0, eigenvectors[cc, 0, 0]], [0, eigenvectors[cc, 1, 0]])
    ax.plot([0, eigenvectors[cc, 0, 1]], [0, eigenvectors[cc, 1, 1]])
    ax.set_aspect(1)
    ax.set_title(f"Eigenvectors of class {cc+1}")
plt.show()
Test Samples | x-value | y-value |
---|---|---|
s1 | 2.3 | 1.9 |
s2 | 7 | -0.3 |
s3 | 10 | 0.5 |
s4 | -1.2 | 0.6 |
test_samples = np.array([[2.3, 1.9], [7, -0.3], [10, 0.5], [-1.2, 0.6]])
Here, the angle $\alpha$ is computed from $$ \alpha = \operatorname{arctan} \left( \frac{\phi_{i, 2}}{\phi_{i, 1}} \right) $$ where $\phi_{i, 1}$ and $\phi_{i, 2}$ are the components of the eigenvector $\vec{\phi_i}$.
Each eigenvector is scaled by its associated eigenvalue $\lambda_i$, so an axis of a class distribution is drawn as $\lambda_i \vec{\phi_i}$.
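As a minimal sketch using the eigenvalues and eigenvectors computed above (note that the visualization code below uses np.arctan2 rather than arctan so that the angle lands in the correct quadrant), the orientation and axis lengths of each class ellipse can be inspected directly:

# orientation and axis lengths of each class ellipse (illustrative sketch only;
# the visualization function below recomputes the same quantities per class)
for c in range(C):
    major_idx = int(np.argmax(eigenvalues[c]))
    phi_major = eigenvectors[c][:, major_idx]        # eigenvectors are columns
    alpha = np.arctan2(phi_major[1], phi_major[0])   # angle of the major axis
    print(f"class {c+1}: alpha = {np.degrees(alpha):.1f} deg, axis lengths = {np.sort(eigenvalues[c])[::-1]}")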
def visualize_space(data, means, eigenvalues, eigenvectors, title=None, save_name=None, figsize=(10, 9), test_samples=None, test_index=None, distances=None, norm="2"):
    fig = plt.figure(figsize=figsize)
    ax = fig.add_subplot(111)
    colors = ["blue", "red", "orange", "green"]
    for c in range(C):
        # patterns
        ax.scatter(data[c][0], data[c][1], color=colors[c], label=f"class {c+1}")
        # mean
        mean_x, mean_y = means[c]
        ax.scatter(mean_x, mean_y, color=colors[c], marker="*", edgecolor="black", s=150, linewidth=2, label=f"mean {c+1}")
        # variance (ellipse spanned by the scaled eigenvectors)
        theta = np.linspace(0, 2*np.pi, 100)
        major_idx = np.argmax(eigenvalues[c])
        # minor_idx = np.argmin(eigenvalues[c])
        # NOTE: if both eigenvalues were equal, argmax and argmin would return the
        # same index, so pick the remaining index explicitly
        minor_idx = 1 if major_idx == 0 else 0
        alpha = np.arctan2(eigenvectors[c, 1, major_idx], eigenvectors[c, 0, major_idx])
        major_r_x = eigenvalues[c, major_idx]
        major_r_y = eigenvalues[c, minor_idx]
        AXIS_COLORS = ["black", "grey"]
        axis_colors = [AXIS_COLORS[major_idx], AXIS_COLORS[minor_idx]]
        e_X = major_r_x * np.cos(theta) * np.cos(alpha) - major_r_y * np.sin(theta) * np.sin(alpha) + mean_x
        e_Y = major_r_x * np.cos(theta) * np.sin(alpha) + major_r_y * np.sin(theta) * np.cos(alpha) + mean_y
        ax.plot(e_X, e_Y, color="black", linestyle="--")
        ax.plot([mean_x, mean_x+eigenvalues[c, major_idx]*eigenvectors[c, 0, major_idx]], [mean_y, mean_y+eigenvalues[c, major_idx]*eigenvectors[c, 1, major_idx]], linewidth=3, color=axis_colors[0])
        ax.plot([mean_x, mean_x+eigenvalues[c, minor_idx]*eigenvectors[c, 0, minor_idx]], [mean_y, mean_y+eigenvalues[c, minor_idx]*eigenvectors[c, 1, minor_idx]], linewidth=3, color=axis_colors[1])
        # print(np.power((mean_x+eigenvalues[c, major_idx]*eigenvectors[c, 0, major_idx]) - mean_x, 2) + np.power((mean_y+eigenvalues[c, major_idx]*eigenvectors[c, 1, major_idx]) - mean_y, 2))
        # print(np.power((mean_x+eigenvalues[c, minor_idx]*eigenvectors[c, 0, minor_idx]) - mean_x, 2) + np.power((mean_y+eigenvalues[c, minor_idx]*eigenvectors[c, 1, minor_idx]) - mean_y, 2))
    # test samples
    if test_samples is not None:
        ax.scatter(test_samples[:, 0], test_samples[:, 1], color="deeppink", marker="x", label="test samples", edgecolor="black", s=50, linewidth=3)
    # distances
    if distances is not None:
        s_x, s_y = test_samples[test_index, 0], test_samples[test_index, 1]
        for c in range(C):
            mu_x, mu_y = means[c]
            ax.plot([s_x, mu_x], [s_y, mu_y], linewidth=3, color="plum")
            ax.text((s_x + mu_x) / 2, (s_y + mu_y) / 2, f"{distances[c]:.2f}")
        predicted_c = np.argmin(distances)
        print("predicted_c", predicted_c + 1)
        ax.plot([s_x, means[predicted_c, 0]], [s_y, means[predicted_c, 1]], linewidth=3, color="darkviolet", label=f"$\\min ||\\vec \\mu_i - \\vec s_j||_{norm}$")
    ax.set_xlabel("$x_1$")
    ax.set_ylabel("$x_2$")
    handles, labels = ax.get_legend_handles_labels()
    handles.append(Line2D([0], [0], color="black", linewidth=3, linestyle='--'))
    labels.append("$\\sigma^2_{c}$")
    if distances is not None:
        handles.insert(0, Line2D([0], [0], color="plum", linewidth=3, linestyle='-'))
        labels.insert(0, f"$||\\vec \\mu_i - \\vec s_j||_{norm}$")
    ax.set_aspect(1)
    plt.legend(handles, labels)
    if title is not None:
        plt.title(title)
    plt.tight_layout()
    # if save_name is not None:
    #     plt.savefig(save_name, dpi=300)
visualize_space(data, means, eigenvalues, eigenvectors, title="Dataset - Original Feature Space", save_name="dataset-original_feature_space.png", test_samples=test_samples) # (10, 7)
J = test_samples.shape[0]
distances = np.zeros((J, C))
def euclidean_distance(x, y):
    return np.sqrt(np.sum(np.power(x - y, 2)))
for c in range(C):
    for j in range(J):
        distances[j, c] = euclidean_distance(test_samples[j], means[c])
distances
array([[ 8.2553291 ,  6.76615584,  5.81573462,  4.29250578],
       [ 6.09858565,  2.7687883 ,  9.13585015,  9.44083627],
       [ 4.5482304 ,  4.72910637, 12.23539492, 12.11178626],
       [11.98733454,  8.88653958,  2.76096551,  2.45484111]])
In the figures plotted below, the plum lines show the Euclidean distances from the test sample to all four class means, and the dark violet line marks the minimum of these distances, i.e., the predicted class.
for j in range(J):  # each test sample
    visualize_space(data, means, eigenvalues, eigenvectors, title=f"Test sample $s_{j+1}$ classification using Euclidean distance", save_name=f"test_samples-euclidean_distances-{j+1}.png", test_samples=test_samples, test_index=j, distances=distances[j]) # (10, 7)
predicted_c 4
predicted_c 2
predicted_c 1
predicted_c 4
def print_report_table(distances):
    for i in range(distances.shape[0]):
        print(f"| s{i+1} | ", end="")
        for j in range(distances.shape[1]):
            print(f"{distances[i, j]:.4f}", end=" | ")
        c = np.argmin(distances[i])
        print(f"class {c+1} | ")
print_report_table(distances)
| s1 | 8.2553 | 6.7662 | 5.8157 | 4.2925 | class 4 |
| s2 | 6.0986 | 2.7688 | 9.1359 | 9.4408 | class 2 |
| s3 | 4.5482 | 4.7291 | 12.2354 | 12.1118 | class 1 |
| s4 | 11.9873 | 8.8865 | 2.7610 | 2.4548 | class 4 |
Test Samples | d($\mu_1$,$s_j$) | d($\mu_2$,$s_j$) | d($\mu_3$,$s_j$) | d($\mu_4$,$s_j$) | Class Assignment |
---|---|---|---|---|---|
s1 | 8.2553 | 6.7662 | 5.8157 | 4.2925 | class 4 |
s2 | 6.0986 | 2.7688 | 9.1359 | 9.4408 | class 2 |
s3 | 4.5482 | 4.7291 | 12.2354 | 12.1118 | class 1 |
s4 | 11.9873 | 8.8865 | 2.7610 | 2.4548 | class 4 |
The whitened covariance matrix $\Sigma_W$ becomes an identity matrix because the whitening transformation rotates the data (by $\Phi^\text{T}_c$) and rescales ("squishes") it (by $\Lambda^{-\frac{1}{2}}_c$). Since $\Phi^\text{T}_c \Sigma_{c} \Phi_c$ equals $\Lambda_c$, the two scaling factors $\Lambda^{-\frac{1}{2}}_c$ cancel it out: $$ \Phi^\text{T}_c \Sigma_{c} \Phi_c = \Lambda_c $$ $$ \Lambda^{-\frac{1}{2}}_c \Lambda_c \Lambda^{-\frac{1}{2}}_c = I $$
We whiten a data sample in the same way as we whiten a mean vector $\vec{\mu_{x, c}}$; however, it must be transformed with the $\Lambda_c$ and $\Phi_c$ of the corresponding class. $$ \vec{x_{W, c}} = \Lambda^{-\frac{1}{2}}_c \Phi^\text{T}_c \vec{x} $$
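As a quick numerical sanity check of the first identity above (a sketch using the quantities already computed; the actual whitening is done in the next cell), the eigenvector basis should diagonalize each covariance matrix:

# verify Phi_c^T Sigma_c Phi_c = Lambda_c for every class
for c in range(C):
    Lambda_c = eigenvectors[c].T @ covariances[c] @ eigenvectors[c]
    assert np.allclose(Lambda_c, np.diag(eigenvalues[c]))
print("Phi^T Sigma Phi = Lambda holds for all classes")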
squishing_matrices = np.zeros_like(covariances)
whitened_data = np.zeros_like(data)
whitened_means = np.zeros_like(means)
whitened_covariances = np.zeros_like(covariances)
whitened_eigenvalues = np.zeros_like(eigenvalues)
whitened_eigenvectors = np.zeros_like(eigenvectors)
for c in range(C):
    squishing_matrices[c] = np.sqrt(np.linalg.inv(np.identity(D) * eigenvalues[c]))
    whitened_data[c] = squishing_matrices[c] @ eigenvectors[c].T @ data[c]
    whitened_means[c] = squishing_matrices[c] @ eigenvectors[c].T @ means[c]
    whitened_covariances[c] = squishing_matrices[c] @ eigenvectors[c].T @ covariances[c] @ eigenvectors[c] @ squishing_matrices[c]
    whitened_eigenvalues[c], whitened_eigenvectors[c] = np.linalg.eig(np.cov(whitened_data[c]))
Notice the values of the whitened covariance matrices: they are identity matrices, as stated above. The off-diagonal entries are not exactly zero, but they are on the order of $10^{-16}$, i.e., numerical precision.
whitened_covariances
array([[[ 1.00000000e+00,  4.96025213e-17],
        [ 0.00000000e+00,  1.00000000e+00]],

       [[ 1.00000000e+00,  1.53540019e-16],
        [ 1.35209346e-16,  1.00000000e+00]],

       [[ 1.00000000e+00, -1.11333113e-16],
        [-1.16447472e-16,  1.00000000e+00]],

       [[ 1.00000000e+00,  0.00000000e+00],
        [ 7.65428907e-17,  1.00000000e+00]]])
fig = plt.figure(figsize=(18, 4))
for cc in range(C):
    ax = fig.add_subplot(140 + cc + 1)
    # eigenvectors are the columns of the matrix returned by np.linalg.eig
    ax.plot([0, whitened_eigenvectors[cc, 0, 0]], [0, whitened_eigenvectors[cc, 1, 0]])
    ax.plot([0, whitened_eigenvectors[cc, 0, 1]], [0, whitened_eigenvectors[cc, 1, 1]])
    ax.set_aspect(1)
    ax.set_title(f"Eigenvectors of the whitened class {cc+1}")
plt.show()
Since there are 4 classes, each test sample has to be whitened with respect to each class distribution separately, using that class's $\Lambda_c$ and $\Phi_c$: $$ \vec{s_{W, c, j}} = \Lambda^{-\frac{1}{2}}_c \Phi^\text{T}_c \vec{s_j} $$
whitened_test_samples = np.zeros((test_samples.shape[0], C, test_samples.shape[1]))
for j in range(J):
    for c in range(C):
        whitened_test_samples[j, c] = squishing_matrices[c] @ eigenvectors[c].T @ test_samples[j]
whitened_test_samples.shape
(4, 4, 2)
visualize_space(whitened_data, whitened_means, whitened_eigenvalues, whitened_eigenvectors, title="Dataset - Whitened Feature Space", save_name="dataset-whitened_feature_space.png")
whitened_distances = np.zeros_like(distances)
for c in range(C):
    for j in range(J):
        whitened_distances[j, c] = euclidean_distance(whitened_test_samples[j, c], whitened_means[c])
whitened_distances
array([[ 4.4631794 ,  8.2269217 ,  3.66605299,  3.01760914],
       [ 2.73444094,  2.50838516,  3.48764967,  6.50903569],
       [ 2.43665098,  2.62587407,  4.68324731,  8.68172594],
       [ 6.51365692, 10.34740388,  2.52802512,  3.07849649]])
def visualize_whitened_space(data, means, eigenvalues, eigenvectors, title=None, save_name=None, figsize=(20, 6), test_samples=None, test_index=None, distances=None, norm="2"):
    fig, axs = plt.subplots(nrows=1, ncols=C, figsize=figsize)
    colors = ["blue", "red", "orange", "green"]
    for c in range(C):
        ax = axs[c]
        # patterns
        ax.scatter(data[c][0], data[c][1], color=colors[c], label=f"class {c+1}")
        # mean
        mean_x, mean_y = means[c]
        ax.scatter(mean_x, mean_y, color=colors[c], marker="*", edgecolor="black", s=150, linewidth=2, label=f"mean {c+1}")
        # variance (ellipse spanned by the scaled eigenvectors)
        theta = np.linspace(0, 2*np.pi, 100)
        major_idx = np.argmax(eigenvalues[c])
        # minor_idx = np.argmin(eigenvalues[c])
        # NOTE: if both eigenvalues were equal, argmax and argmin would return the
        # same index, so pick the remaining index explicitly
        minor_idx = 1 if major_idx == 0 else 0
        alpha = np.arctan2(eigenvectors[c, 1, major_idx], eigenvectors[c, 0, major_idx])
        major_r_x = eigenvalues[c, major_idx]
        major_r_y = eigenvalues[c, minor_idx]
        AXIS_COLORS = ["black", "grey"]
        axis_colors = [AXIS_COLORS[major_idx], AXIS_COLORS[minor_idx]]
        e_X = major_r_x * np.cos(theta) * np.cos(alpha) - major_r_y * np.sin(theta) * np.sin(alpha) + mean_x
        e_Y = major_r_x * np.cos(theta) * np.sin(alpha) + major_r_y * np.sin(theta) * np.cos(alpha) + mean_y
        ax.plot(e_X, e_Y, color="black", linestyle="--")
        ax.plot([mean_x, mean_x+eigenvalues[c, major_idx]*eigenvectors[c, 0, major_idx]], [mean_y, mean_y+eigenvalues[c, major_idx]*eigenvectors[c, 1, major_idx]], linewidth=3, color=axis_colors[0])
        ax.plot([mean_x, mean_x+eigenvalues[c, minor_idx]*eigenvectors[c, 0, minor_idx]], [mean_y, mean_y+eigenvalues[c, minor_idx]*eigenvectors[c, 1, minor_idx]], linewidth=3, color=axis_colors[1])
        # ax.quiver(mean_x, mean_y, eigenvectors[c, 0, major_idx], eigenvectors[c, 1, major_idx], scale=eigenvalues[c, major_idx], scale_units="xy", linewidth=3, color="orange")
        # ax.quiver(mean_x, mean_y, eigenvectors[c, 0, minor_idx], eigenvectors[c, 1, minor_idx], scale=eigenvalues[c, minor_idx], scale_units="xy", linewidth=3, color="yellow")
        # print(np.power((mean_x+eigenvalues[c, major_idx]*eigenvectors[c, 0, major_idx]) - mean_x, 2) + np.power((mean_y+eigenvalues[c, major_idx]*eigenvectors[c, 1, major_idx]) - mean_y, 2))
        # print(np.power((mean_x+eigenvalues[c, minor_idx]*eigenvectors[c, 0, minor_idx]) - mean_x, 2) + np.power((mean_y+eigenvalues[c, minor_idx]*eigenvectors[c, 1, minor_idx]) - mean_y, 2))
        # test samples (one whitened test sample per class)
        if test_samples is not None:
            ax.scatter(test_samples[c, 0], test_samples[c, 1], color="deeppink", marker="x", label="test samples", edgecolor="black", s=50, linewidth=3)
        # distances
        if distances is not None:
            s_x, s_y = test_samples[c, 0], test_samples[c, 1]
            mu_x, mu_y = means[c]
            ax.plot([s_x, mu_x], [s_y, mu_y], linewidth=3, color="plum")
            ax.text((s_x + mu_x) / 2, (s_y + mu_y) / 2, f"{distances[c]:.2f}")
        ax.set_xlabel("$x_1$")
        ax.set_ylabel("$x_2$")
        handles, labels = ax.get_legend_handles_labels()
        handles.append(Line2D([0], [0], color="black", linewidth=3, linestyle='--'))
        labels.append("$\\sigma^2_{c}$")
        if distances is not None:
            handles.insert(0, Line2D([0], [0], color="plum", linewidth=3, linestyle='-'))
            labels.insert(0, f"$||\\vec \\mu_i - \\vec s_j||_{norm}$")
        ax.legend(handles, labels)
        ax.set_aspect(1)
    if title is not None:
        plt.suptitle(title)
    plt.tight_layout()
    # if save_name is not None:
    #     plt.savefig(save_name, dpi=300)
for j in range(J):
    visualize_whitened_space(whitened_data, whitened_means, whitened_eigenvalues, whitened_eigenvectors, title=f"Whitened test sample $s_{j+1}$ classification using Euclidean distance in the whitened space", save_name=f"whitened_test_samples-euclidean_distances-{j+1}.png", test_samples=whitened_test_samples[j], test_index=j, distances=whitened_distances[j])
# for filling in the report table
print_report_table(whitened_distances)
| s1 | 4.4632 | 8.2269 | 3.6661 | 3.0176 | class 4 |
| s2 | 2.7344 | 2.5084 | 3.4876 | 6.5090 | class 2 |
| s3 | 2.4367 | 2.6259 | 4.6832 | 8.6817 | class 1 |
| s4 | 6.5137 | 10.3474 | 2.5280 | 3.0785 | class 3 |
Test Samples | d($\mu_1$,$s_j$) | d($\mu_2$,$s_j$) | d($\mu_3$,$s_j$) | d($\mu_4$,$s_j$) | Class Assignment |
---|---|---|---|---|---|
s1 | 4.4632 | 8.2269 | 3.6661 | 3.0176 | class 4 |
s2 | 2.7344 | 2.5084 | 3.4876 | 6.5090 | class 2 |
s3 | 2.4367 | 2.6259 | 4.6832 | 8.6817 | class 1 |
s4 | 6.5137 | 10.3474 | 2.5280 | 3.0785 | class 3 |
The Mahalanobis distance measures the distance from a pattern to a distribution. It is preferable here because the computation can be performed directly in the original feature space, i.e., we do not have to apply the whitening transformation to the data. It is defined as follows: $$ r^2(\vec{\mu_c}, \vec{x_j}) = (\vec{x_j} - \vec{\mu_c})^{\text{T}} \Sigma_c^{-1} (\vec{x_j} - \vec{\mu_c}) $$
def mahalanobis_distance(x, mean, inv_cov):
    return np.sqrt((x - mean).T @ inv_cov @ (x - mean))
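As an optional cross-check (a sketch, not part of the original solution), SciPy provides the same metric as scipy.spatial.distance.mahalanobis, which takes the inverse covariance matrix as its third argument:

from scipy.spatial.distance import mahalanobis as scipy_mahalanobis
# compare the hand-written implementation against SciPy for one sample/class pair
inv_cov0 = np.linalg.inv(covariances[0])
ours = mahalanobis_distance(test_samples[0], means[0], inv_cov0)
ref = scipy_mahalanobis(test_samples[0], means[0], inv_cov0)
print(np.isclose(ours, ref))  # True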
mahalanobis_distances = np.zeros_like(distances)
for c in range(C):
    inv_cov = np.linalg.inv(covariances[c])
    for j in range(J):
        mahalanobis_distances[j, c] = mahalanobis_distance(test_samples[j], means[c], inv_cov)
mahalanobis_distances
array([[ 4.4631794 ,  8.2269217 ,  3.66605299,  3.01760914],
       [ 2.73444094,  2.50838516,  3.48764967,  6.50903569],
       [ 2.43665098,  2.62587407,  4.68324731,  8.68172594],
       [ 6.51365692, 10.34740388,  2.52802512,  3.07849649]])
for j in range(J):  # each test sample
    visualize_space(data, means, eigenvalues, eigenvectors, title=f"Test sample $s_{j+1}$ classification using Mahalanobis distance", save_name=f"test_samples-mahalanobis_distances-{j+1}.png", test_samples=test_samples, test_index=j, distances=mahalanobis_distances[j], norm="M") # (10, 7)
predicted_c 4
predicted_c 2
predicted_c 1
predicted_c 3
print_report_table(mahalanobis_distances)
| s1 | 4.4632 | 8.2269 | 3.6661 | 3.0176 | class 4 |
| s2 | 2.7344 | 2.5084 | 3.4876 | 6.5090 | class 2 |
| s3 | 2.4367 | 2.6259 | 4.6832 | 8.6817 | class 1 |
| s4 | 6.5137 | 10.3474 | 2.5280 | 3.0785 | class 3 |
Test Samples | d($\mu_1$,$s_j$) | d($\mu_2$,$s_j$) | d($\mu_3$,$s_j$) | d($\mu_4$,$s_j$) | Class Assignment |
---|---|---|---|---|---|
s1 | 4.4632 | 8.2269 | 3.6661 | 3.0176 | class 4 |
s2 | 2.7344 | 2.5084 | 3.4876 | 6.5090 | class 2 |
s3 | 2.4367 | 2.6259 | 4.6832 | 8.6817 | class 1 |
s4 | 6.5137 | 10.3474 | 2.5280 | 3.0785 | class 3 |
- Write and submit a Mini-Project Report 1 containing the answers to all the questions above, including a discussion on the results – i.e. the mean and covariance before and after the whitening; the class assignments in all three cases; etc.
- Submit your implementations.
Test Samples | x-value | y-value | Assignment (2-norm, original space) | Assignment (2-norm, whitened space) | Assignment (Mahalanobis distance) |
---|---|---|---|---|---|
s1 | 2.3 | 1.9 | class 4 | class 4 | class 4 |
s2 | 7 | -0.3 | class 2 | class 2 | class 2 |
s3 | 10 | 0.5 | class 1 | class 1 | class 1 |
s4 | -1.2 | 0.6 | class 4 | class 3 | class 3 |
The classification results of the test samples $s_1, s_2, s_3$ are the same under all three approaches: they are assigned to classes 4, 2, and 1, respectively. Interestingly, the test sample $s_4$ differs. In the original feature space, comparing Euclidean distances to the four class means assigns $s_4$ to class 4, but the other two methods (Euclidean distance in the whitened space and the Mahalanobis distance) assign it to class 3. The Mahalanobis distances from $s_4$ to the distributions of classes 3 and 4 are very close. The plain Euclidean distance is not appropriate here because the data of classes 3 and 4 are not aligned; they spread in different directions.
"Original means", means
('Original means',
 array([[ 9.93166666,  5.04771704],
        [ 6.89476702, -3.06678779],
        [-1.96618141, -2.05252646],
        [-1.85830966,  2.96492564]]))
"Whitened means", whitened_means
('Whitened means',
 array([[-3.90753781, -4.29897461],
        [-8.65781466, -1.39993863],
        [-0.87503941, -1.68254033],
        [-1.91477051,  3.12275049]]))
covariances
array([[[ 2.92878667,  1.34060751],
        [ 1.34060751,  4.14604723]],

       [[ 1.90650611,  1.2951869 ],
        [ 1.2951869 ,  2.03553604]],

       [[ 6.69513194,  1.01051255],
        [ 1.01051255,  1.17354871]],

       [[ 1.90363212, -0.53673905],
        [-0.53673905,  0.66481358]]])
whitened_covariances
array([[[ 1.00000000e+00,  4.96025213e-17],
        [ 0.00000000e+00,  1.00000000e+00]],

       [[ 1.00000000e+00,  1.53540019e-16],
        [ 1.35209346e-16,  1.00000000e+00]],

       [[ 1.00000000e+00, -1.11333113e-16],
        [-1.16447472e-16,  1.00000000e+00]],

       [[ 1.00000000e+00,  0.00000000e+00],
        [ 7.65428907e-17,  1.00000000e+00]]])
I = []
for c in range(C):
I.append(np.identity(whitened_covariances[c].shape[0]))
I = np.array(I)
I
array([[[1., 0.],
        [0., 1.]],

       [[1., 0.],
        [0., 1.]],

       [[1., 0.],
        [0., 1.]],

       [[1., 0.],
        [0., 1.]]])
"Whitened covariance matrices = identity matrices", np.allclose(whitened_covariances, I)
('Whitened covariance matrices = identity matrices', True)
This confirms that the whitened covariance matrices are identity matrices, which is the result of applying the whitening transformation to the original space: the whitened data of each class spread equally in every direction, with unit standard deviation along each axis.
"Euclidean distances in the original feature space", distances
('Euclidean distances in the original feature space',
 array([[ 8.2553291 ,  6.76615584,  5.81573462,  4.29250578],
        [ 6.09858565,  2.7687883 ,  9.13585015,  9.44083627],
        [ 4.5482304 ,  4.72910637, 12.23539492, 12.11178626],
        [11.98733454,  8.88653958,  2.76096551,  2.45484111]]))
"Euclidean distances in the whitened space", whitened_distances, "Mahalanobis distances", mahalanobis_distances
('Euclidean distances in the whitened space',
 array([[ 4.4631794 ,  8.2269217 ,  3.66605299,  3.01760914],
        [ 2.73444094,  2.50838516,  3.48764967,  6.50903569],
        [ 2.43665098,  2.62587407,  4.68324731,  8.68172594],
        [ 6.51365692, 10.34740388,  2.52802512,  3.07849649]]),
 'Mahalanobis distances',
 array([[ 4.4631794 ,  8.2269217 ,  3.66605299,  3.01760914],
        [ 2.73444094,  2.50838516,  3.48764967,  6.50903569],
        [ 2.43665098,  2.62587407,  4.68324731,  8.68172594],
        [ 6.51365692, 10.34740388,  2.52802512,  3.07849649]]))
"Are they equivalent?", np.allclose(mahalanobis_distances, whitened_distances)
('Are they equivalent?', True)
We can prove that a Euclidean distance in the whitened space equals a Mahalanobis distance.
Solve for $\Sigma_c$ from the equation that arises in the whitening transformation. Since $\Phi_c$ is orthogonal, $(\Phi^\text{T}_c)^{-1} = \Phi_c$ and $\Phi_c^{-1} = \Phi^\text{T}_c$.
$$ \Phi^\text{T}_c \Sigma_{c} \Phi_c = \Lambda_c $$
$$ (\Phi^\text{T}_c)^{-1} \Phi^\text{T}_c \Sigma_{c} \Phi_c = (\Phi^\text{T}_c)^{-1} \Lambda_c $$
$$ \Sigma_{c} \Phi_c = (\Phi^\text{T}_c)^{-1} \Lambda_c $$
$$ \Sigma_{c} \Phi_c \Phi_c^{-1} = (\Phi^\text{T}_c)^{-1} \Lambda_c \Phi_c^{-1} $$
$$ \Sigma_{c} = (\Phi^\text{T}_c)^{-1} \Lambda_c \Phi_c^{-1} $$
$$ \Sigma_{c} = \Phi_c \Lambda_c \Phi^\text{T}_c $$
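This reconstruction can be verified numerically with the arrays computed earlier (a small sanity-check sketch):

# Sigma_c is recovered from its eigendecomposition Phi_c Lambda_c Phi_c^T
for c in range(C):
    reconstructed = eigenvectors[c] @ np.diag(eigenvalues[c]) @ eigenvectors[c].T
    assert np.allclose(reconstructed, covariances[c])
print("Sigma_c = Phi_c Lambda_c Phi_c^T holds for all classes")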
Substitute $\Sigma_c$ into the Mahalanobis distance equation, using $(AB)^\text{T} = B^\text{T} A^\text{T}$ and the fact that $\Lambda_c^{-\frac{1}{2}}$ is symmetric, so $(\Phi_c \Lambda_c^{-\frac{1}{2}})^\text{T} = \Lambda_c^{-\frac{1}{2}} \Phi^\text{T}_c$.
$$ r^2(\vec{\mu_c}, \vec{x_j}) = (\vec{x_j} - \vec{\mu_c})^{\text{T}} \Sigma_c^{-1} (\vec{x_j} - \vec{\mu_c}) $$
$$ = (\vec{x_j} - \vec{\mu_c})^{\text{T}} (\Phi_c \Lambda_c \Phi^\text{T}_c)^{-1} (\vec{x_j} - \vec{\mu_c}) $$
$$ = (\vec{x_j} - \vec{\mu_c})^{\text{T}} (\Phi_c \Lambda_c^{-1} \Phi^\text{T}_c) (\vec{x_j} - \vec{\mu_c}) $$
$$ = (\vec{x_j} - \vec{\mu_c})^{\text{T}} (\Phi_c \Lambda_c^{-\frac{1}{2}}) (\Lambda_c^{-\frac{1}{2}} \Phi^\text{T}_c) (\vec{x_j} - \vec{\mu_c}) $$
$$ = [(\Lambda_c^{-\frac{1}{2}} \Phi^\text{T}_c) (\vec{x_j} - \vec{\mu_c})]^{\text{T}} [(\Lambda_c^{-\frac{1}{2}} \Phi^\text{T}_c) (\vec{x_j} - \vec{\mu_c})] $$
$$ = (\vec{x_{W, j}} - \vec{\mu_{W, c}})^{\text{T}} (\vec{x_{W, j}} - \vec{\mu_{W, c}}) $$
$$ = ||\vec{\mu_{W, c}} - \vec{x_{W, j}}||_2^2 $$
$$ = d^2(\vec{\mu_{W, c}}, \vec{x_{W, j}}) $$
Taking the square root of both sides:
$$ r^2(\vec{\mu_c}, \vec{x_j}) = d^2(\vec{\mu_{W, c}}, \vec{x_{W, j}}) $$
$$ r(\vec{\mu_c}, \vec{x_j}) = d(\vec{\mu_{W, c}}, \vec{x_{W, j}}) $$