import numpy as np
from IPython.display import display, Math
import matplotlib.pyplot as plt
class1_samples = np.array([
[0.42, -0.087, 0.58],
[-0.2, -3.3, -3.4],
[1.3, -0.32, 1.7],
[0.39, 0.71, 0.23],
[-1.6, -5.3, -0.15],
[-0.029, 0.89, -4.7],
[-0.23, 1.9, 2.2],
[0.27, -0.3, -0.87],
[-1.9, 0.76, -2.1],
[0.87, -1.0, -2.6]
])
class2_samples = np.array([
[-0.4, 0.58, 0.089],
[-0.31, 0.27, -0.04],
[0.38, 0.055, -0.035],
[-0.15, 0.53, 0.011],
[-0.35, 0.47, 0.034],
[0.17, 0.69, 0.1],
[-0.011, 0.55, -0.18],
[-0.27, 0.61, 0.12],
[-0.065, 0.49, 0.0012],
[-0.12, 0.054, -0.063]
])
class3_samples = np.array([
[0.83, 1.6, -0.014],
[1.1, 1.6, 0.48],
[-0.44, -0.41, 0.32],
[0.047, -0.45, 1.4],
[0.28, 0.35, 3.1],
[-0.39, -0.48, 0.11],
[0.34, -0.079, 0.14],
[-0.3, -0.22, 2.2],
[1.1, 1.2, -0.46],
[0.18, -0.11, -0.49]
])
samples = np.array([class1_samples, class2_samples, class3_samples])
def answer(text, ans):
    # Render a labelled result as LaTeX; arrays are typeset as bmatrix blocks.
    if isinstance(ans, np.ndarray):
        t = r'\begin{bmatrix} '
        for i in ans:
            if not isinstance(i, np.ndarray):
                # 1-D array: one scalar entry per row.
                t += f'{i:.4f}' + r' \\ '
            else:
                # 2-D array: format each row, separating columns with '&'.
                a_str = np.array2string(i, precision=4, separator=r' & ')
                t += a_str[1:-1]
                t += r' \\ '
        t += r'\end{bmatrix}'
        display(Math(f'{text} = {t}'))
    else:
        display(Math(f'{text} = {ans:.4f}'))
Consider Gaussian density models in different dimensions.
Write a program to find the maximum-likelihood values $\hat{\mu}$ and $\hat{\sigma}^2$. Apply your program individually to each of the three features $x_i$ of category $\omega_1$ in the table above.
def mean(samples):
return np.sum(samples) / np.size(samples)
a_samples1 = class1_samples[:, 0]
a_samples2 = class1_samples[:, 1]
a_samples3 = class1_samples[:, 2]
a_mu1 = mean(a_samples1)
a_mu2 = mean(a_samples2)
a_mu3 = mean(a_samples3)
answer(r"\mu_1", a_mu1)
answer(r"\mu_2", a_mu2)
answer(r"\mu_3", a_mu3)
Here the unbiased estimator of the variance (dividing by $n-1$) is used rather than the strict maximum-likelihood estimator (which divides by $n$).
def variance(samples, mean):
    # Unbiased estimator: divide by n - 1 rather than n.
    return np.sum((samples - mean) ** 2) / (np.size(samples) - 1)
a_var1 = variance(a_samples1, a_mu1)
a_var2 = variance(a_samples2, a_mu2)
a_var3 = variance(a_samples3, a_mu3)
answer(r"\sigma_1^2", a_var1)
answer(r"\sigma_2^2", a_var2)
answer(r"\sigma_3^2", a_var3)
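For comparison, the strict maximum-likelihood estimate would divide by $n$ instead of $n-1$; a minimal sketch (the helper variance_ml is ours, not part of the exercise code):
def variance_ml(samples, mean):
    # Maximum-likelihood variance: divide by n rather than n - 1.
    return np.sum((samples - mean) ** 2) / np.size(samples)

# With n = 10 this is exactly 9/10 of the unbiased estimate shown above.
answer(r"\sigma_{1,\mathrm{ML}}^2", variance_ml(a_samples1, a_mu1))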
Modify your program to apply to two-dimensional Gaussian data $p(x) \sim \mathcal{N}(\mathbf{\mu}, \mathbf{\Sigma})$. Apply your data to each of the three possible pairings of two features for $\omega_1$.
b_samples1 consists of features 1 and 2 of $\omega_1$, b_samples2 of features 1 and 3, and b_samples3 of features 2 and 3.
b_samples1 = class1_samples[:, [0, 1]]
b_samples2 = class1_samples[:, [0, 2]]
b_samples3 = class1_samples[:, [1, 2]]
def b_mean(samples):
return np.sum(samples, axis=0) / samples.shape[0]
b_mu1 = b_mean(b_samples1)
b_mu2 = b_mean(b_samples2)
b_mu3 = b_mean(b_samples3)
answer(r"\vec{\mu}_1", b_mu1)
answer(r"\vec{\mu}_2", b_mu2)
answer(r"\vec{\mu}_3", b_mu3)
def b_covariance(samples, mu):
    # Sum of outer products of the centered samples, divided by n - 1 (unbiased).
    cov = np.zeros((len(mu), len(mu)))
    for x in samples:
        diff = x - mu
        cov += np.outer(diff, diff)
    cov /= len(samples) - 1
    return cov
b_cov1 = b_covariance(b_samples1, b_mu1)
b_cov2 = b_covariance(b_samples2, b_mu2)
b_cov3 = b_covariance(b_samples3, b_mu3)
# Sanity check: np.cov(b_samples1.T, ddof=1) gives the same matrix.
answer(r"\Sigma_1", b_cov1)
answer(r"\Sigma_2", b_cov2)
answer(r"\Sigma_3", b_cov3)
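As an optional sanity check, the hand-rolled estimates can be compared against NumPy's built-in np.cov, which with ddof=1 uses the same $n-1$ divisor:
# b_covariance should agree with np.cov (after transposing so rows are variables).
assert np.allclose(b_cov1, np.cov(b_samples1.T, ddof=1))
assert np.allclose(b_cov2, np.cov(b_samples2.T, ddof=1))
assert np.allclose(b_cov3, np.cov(b_samples3.T, ddof=1))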
Modify your program to apply to three-dimensional Gaussian data. Apply your program to the full three-dimensional data for $\omega_1$.
c_samples = class1_samples
We can reuse the mean and covariance functions from sub-question (b).
# np.cov(c_samples.T, ddof=1)
c_mu = b_mean(c_samples)
answer(r"\vec{\mu}", c_mu)
c_cov = b_covariance(c_samples, c_mu)
answer(r"\Sigma", c_cov)
Assume your three-dimensional model is separable, so that $$ \mathbf{\Sigma} = \operatorname{diag}(\sigma_1^2, \sigma_2^2, \sigma_3^2). $$ Write a program to estimate the mean and the diagonal components of $\mathbf{\Sigma}$. Apply your program to the data in $\omega_2$.
d_samples1 = class2_samples[:, 0]
d_samples2 = class2_samples[:, 1]
d_samples3 = class2_samples[:, 2]
d_mu1 = mean(d_samples1)
d_mu2 = mean(d_samples2)
d_mu3 = mean(d_samples3)
answer(r"\mu_1", d_mu1)
answer(r"\mu_2", d_mu2)
answer(r"\mu_3", d_mu3)
d_var1 = variance(d_samples1, d_mu1)
d_var2 = variance(d_samples2, d_mu2)
d_var3 = variance(d_samples3, d_mu3)
answer(r"\sigma_1^2", d_var1)
answer(r"\sigma_2^2", d_var2)
answer(r"\sigma_3^2", d_var3)
# Assemble the diagonal covariance matrix from the per-feature variances.
d_cov = np.diag([d_var1, d_var2, d_var3])
answer(r"\Sigma", d_cov)
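As an optional cross-check, the diagonal of the full covariance estimate for $\omega_2$ reproduces the three variances used above:
# The separable model keeps only the diagonal of the full covariance estimate.
d_full_cov = b_covariance(class2_samples, b_mean(class2_samples))
assert np.allclose(np.diag(d_full_cov), [d_var1, d_var2, d_var3])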
Since we estimate a mean for each feature independently, these per-feature means can be stacked to form the higher-dimensional mean vectors.
Questions a, b, and c are all about $\omega_1$, so we can structure the means as follows:
Question a) 1-d feature
$$ \mu_1^{(1)} = -0.0709, \qquad \mu_2^{(1)} = -0.6047, \qquad \mu_3^{(1)} = -0.9110 $$
Question b) 2-d feature
$$ \vec{\mu}_1^{(2)} = \begin{bmatrix} \mu_1^{(1)} \\ \mu_2^{(1)} \end{bmatrix} = \begin{bmatrix} -0.0709 \\ -0.6047 \end{bmatrix}, \qquad \vec{\mu}_2^{(2)} = \begin{bmatrix} \mu_1^{(1)} \\ \mu_3^{(1)} \end{bmatrix} = \begin{bmatrix} -0.0709 \\ -0.9110 \end{bmatrix}, \qquad \vec{\mu}_3^{(2)} = \begin{bmatrix} \mu_2^{(1)} \\ \mu_3^{(1)} \end{bmatrix} = \begin{bmatrix} -0.6047 \\ -0.9110 \end{bmatrix} $$
Question c) 3-d feature
$$ \vec{\mu}^{(3)} = \begin{bmatrix} \mu_1^{(1)} \\ \mu_2^{(1)} \\ \mu_3^{(1)} \end{bmatrix} = \begin{bmatrix} -0.0709 \\ -0.6047 \\ -0.9110 \end{bmatrix} $$
Question d, however, is about $\omega_2$, so its mean values differ from those in questions a, b, and c.
Just like the means, the one-dimensional variances make up the diagonal of the higher-dimensional covariance matrices. We can see the pattern as follows:
Question a) 1-d feature
$$ \sigma_1^2 = 1.0069, \qquad \sigma_2^2 = 4.6675, \qquad \sigma_3^2 = 5.0466 $$
Question b) 2-d feature
$$ \mathbf{\Sigma}_1 = \begin{bmatrix} \sigma_1^2 & \sigma_{12} \\ \sigma_{21} & \sigma_2^2 \end{bmatrix} = \begin{bmatrix} 1.0069 & 0.6309 \\ 0.6309 & 4.6675 \end{bmatrix}, \qquad \mathbf{\Sigma}_2 = \begin{bmatrix} \sigma_1^2 & \sigma_{13} \\ \sigma_{31} & \sigma_3^2 \end{bmatrix} = \begin{bmatrix} 1.0069 & 0.4379 \\ 0.4379 & 5.0466 \end{bmatrix}, \qquad \mathbf{\Sigma}_3 = \begin{bmatrix} \sigma_2^2 & \sigma_{23} \\ \sigma_{32} & \sigma_3^2 \end{bmatrix} = \begin{bmatrix} 4.6675 & 0.8152 \\ 0.8152 & 5.0466 \end{bmatrix} $$
Question c) 3-d feature
$$ \mathbf{\Sigma} = \begin{bmatrix} \sigma_1^2 & \sigma_{12} & \sigma_{13} \\ \sigma_{21} & \sigma_2^2 & \sigma_{23} \\ \sigma_{31} & \sigma_{32} & \sigma_3^2 \end{bmatrix} = \begin{bmatrix} 1.0069 & 0.6309 & 0.4379 \\ 0.6309 & 4.6675 & 0.8152 \\ 0.4379 & 0.8152 & 5.0466 \end{bmatrix} $$
Question d)
Since we use the data in $\omega_2$ instead of $\omega_1$, the variances differ from those in questions a, b, and c. Moreover, the covariance matrix $\mathbf{\Sigma}$ in question d is a diagonal matrix: it contains only the variances, with the covariances set to zero.
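A quick numerical check of this nesting, using the quantities computed above (the index lists are our choice):
# Lower-dimensional estimates are sub-blocks of the three-dimensional ones.
assert np.allclose(c_mu, [a_mu1, a_mu2, a_mu3])
assert np.allclose(np.diag(c_cov), [a_var1, a_var2, a_var3])
for pair, cov2d in zip(([0, 1], [0, 2], [1, 2]), (b_cov1, b_cov2, b_cov3)):
    assert np.allclose(cov2d, c_cov[np.ix_(pair, pair)])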
Consider a one-dimensional model of a triangular density governed by two scalar parameters: $$ p(x|\mathbf{\theta}) \equiv T(\mu, \delta) = \begin{cases} \frac{\delta - |x - \mu|}{\delta^2} & \text{for $|x - \mu| < \delta$} \\ 0 & \text{otherwise,} \end{cases} $$ where $\mathbf{\theta} = \begin{pmatrix} \mu \\ \delta \end{pmatrix} $. Write a program to calculate the density $p(x|\mathcal{D})$ via Bayesian methods (Eq. 25) and apply it to the $x_2$ feature of category $\omega_2$. Assume your priors on the parameters are uniform throughout the range of the data. Plot your resulting posterior density $p(x|\mathcal{D})$.
D = class2_samples[:, 1]
D
array([0.58 , 0.27 , 0.055, 0.53 , 0.47 , 0.69 , 0.55 , 0.61 , 0.49 , 0.054])
def likelihood_dist(x, mu, delta):
    # Triangular density T(mu, delta): peak 1/delta at x = mu, support (mu - delta, mu + delta).
    if np.abs(x - mu) < delta:
        return (delta - np.abs(x - mu)) / (delta ** 2)
    return 0
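As a quick sanity check, the triangular density should integrate to one; here we approximate the integral on a grid for one choice of $(\mu, \delta)$ (the grid is our choice):
# Riemann-sum check that T(mu=0, delta=2) integrates to approximately 1.
dx = 0.001
xs = np.arange(-5, 5, dx)
print(np.sum([likelihood_dist(x, 0, 2) for x in xs]) * dx)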
fig, ax = plt.subplots()
X = np.arange(-5, 5, 0.01)
Y = [likelihood_dist(x, 0, 2) for x in X]
ax.plot(X, Y, linewidth=4)
ax.set_xlabel("$x$")
ax.set_ylabel(r"$p(x|\theta)$")
plt.show()
def prior_dist(x, a, b):
    # Uniform density on [a, b].
    if a <= x <= b:
        return 1. / (b - a)
    return 0
fig, ax = plt.subplots()
X = np.arange(-0.5, 1.5, 0.01)
Y = [prior_dist(x, 0, 1) for x in X]
Y /= np.sum(Y)
ax.plot(X, Y, linewidth=4)
ax.set_xlabel(r"$\theta$")
ax.set_ylabel(r"$p(\theta)$")
plt.show()
Unlike the maximum-likelihood approach, which treats $\theta$ as a fixed but unknown quantity, Bayesian estimation treats $\theta$ as a random variable. So we need to find the distribution of that random variable, i.e. the parameter distribution.
We assume that the parametric form of the density $p(x|\mathbf{\theta})$ is known; in this case it is a triangular density. What we want to find is the value of the parameter vector $\mathbf{\theta}$.
We can compute $p(x|D)$ from $p(x|\theta)$ and $p(\theta|D)$ as given by:
$$\begin{align} p(x|D) &= \int p(x, \theta | D) \,d\theta \\ &= \int p(x | \theta, D)\, p(\theta | D) \,d\theta \\ &= \int p(x | \theta)\, p(\theta | D) \,d\theta \end{align}$$
$p(\theta|D)$ is estimated using Bayes' formula:
$$\begin{align} p(\theta|D) &= \frac{p(D|\theta)\,p(\theta)}{p(D)} \end{align}$$
The training set $D = \{x_1, \dots, x_n\}$ contains $n$ samples, assumed i.i.d. (independent and identically distributed). Thus we can compute $p(D|\theta)$ as follows:
$$\begin{align} p(D|\theta) &= \prod_{k=1}^{n} p(x_k|\theta) \end{align}$$
Substituting $p(D|\theta)$ back into $p(\theta|D)$, we get:
$$\begin{align} p(\theta|D) &= \frac{p(D|\theta)\,p(\theta)}{p(D)} = \frac{\prod_{k=1}^{n} p(x_k|\theta)\,p(\theta)}{p(D)} \end{align}$$
where
$$\begin{align} p(D) &= \int p(D|\theta)\,p(\theta)\,d\theta \end{align}$$
The prior density $p(\theta)$ is specified in the question to be a uniform distribution over the range of the data, i.e. an uninformative prior:
$$\begin{align} p(\theta) &= \mathcal{U}(0.054, 0.69) = \begin{cases} \frac{1}{0.69-0.054} & \text{for $0.054 \leq \theta \leq 0.69$} \\ 0 & \text{otherwise.} \end{cases} \end{align}$$
We also know the parametric form of $p(x|\theta)$, as it is given in the question.
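On the discrete grid of parameter values used in the code below, these integrals become sums; with grid points $\theta_j$ and grid prior weights $P(\theta_j)$ this is a restatement of the computation that follows, not an extra assumption:
$$ P(\theta_j|D) = \frac{\prod_{k=1}^{n} p(x_k|\theta_j)\,P(\theta_j)}{\sum_m \prod_{k=1}^{n} p(x_k|\theta_m)\,P(\theta_m)}, \qquad p(x|D) \approx \sum_j p(x|\theta_j)\,P(\theta_j|D). $$
The divisions by np.sum(pTheta) and np.sum(posteriors) in the code perform exactly these normalizations.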
The range of the input data is as follows:
D.min(), D.max()
(0.054, 0.69)
For this first pass, $\theta$ is just $\mu$: assume the width of the likelihood (triangular) density is fixed at $\delta = 2$.
initial_delta = 2
mu = np.arange(0, 1.001, 0.001)
We use an uninformative (uniform) prior throughout the range of the data.
U_a = D.min()
U_b = D.max()
pTheta = [prior_dist(m, U_a, U_b) for m in mu]
pTheta /= np.sum(pTheta)
fig, ax = plt.subplots()
X = mu
Y = pTheta
ax.plot(X, Y, linewidth=4)
ax.set_xlabel(r"$\theta$")
ax.set_ylabel(r"$p(\theta)$")
plt.show()
Check that the a priori density $p(\theta)$ sums to $1$.
np.sum(pTheta)
0.9999999999999996
posteriors = []
for m, p_theta in zip(mu, pTheta):
    # Likelihood of the whole data set for this candidate mu (i.i.d. product)...
    p_theta_D_posterior = 1
    for x in D:
        p_theta_D_posterior *= likelihood_dist(x, m, initial_delta)
    # ...times the prior; the normalization below supplies the 1/p(D) factor.
    p_theta_D_posterior *= p_theta
    posteriors.append(p_theta_D_posterior)
posteriors = np.array(posteriors) / np.sum(posteriors)
Check that the posterior density $p(\theta|D)$ sums to $1$.
np.sum(posteriors)
1.0000000000000002
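With only ten samples the running product of likelihoods stays comfortably above underflow, but for larger data sets the same posterior is usually accumulated in log space; a minimal sketch under that assumption (variable names are ours):
# Same grid posterior, accumulated as log-likelihood + log-prior, then exponentiated.
tiny = 1e-300                                   # guard against log(0)
log_post = np.array([
    np.sum([np.log(likelihood_dist(x, m, initial_delta) + tiny) for x in D]) + np.log(p + tiny)
    for m, p in zip(mu, pTheta)
])
log_post -= log_post.max()                      # shift for numerical stability
posteriors_log = np.exp(log_post) / np.exp(log_post).sum()
assert np.allclose(posteriors_log, posteriors)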
fig, ax = plt.subplots(figsize=(10, 6))
ax.plot(mu, posteriors, linewidth=4)
ax.set_xlabel(r"$\theta$", size=14)
ax.set_ylabel(r"$p(\theta|D) = p(\mu|D)$", size=14)
plt.show()
X = np.arange(-3, 3.5, 0.001)
Y = []
for x in X:
    # p(x|D) ~ sum over the mu grid of p(x|mu, delta=2) * p(mu|D).
    p_x_D = 0
    for m, p in zip(mu, posteriors):
        p_x_D += likelihood_dist(x, m, initial_delta) * p
    Y.append(p_x_D)
Y /= np.sum(Y)
Below is the plot of $p(x|D)$, obtained by averaging $p(x|\mu, \delta=2)$ over the posterior $p(\mu|D)$ while keeping $\delta$ fixed.
fig, ax = plt.subplots(figsize=(10, 6))
ax.plot(X, Y, linewidth=4)
ax.set_xlabel(r"$x$", size=14)
ax.set_ylabel(r"$p(x|D)$", size=14)
plt.show()
Check that the desired class-conditional density $p(x|D)$ sums to $1$.
np.sum(Y)
0.9999999999999999
We can also verify that the peak of $p(x|D)$ lies close to the sample mean.
f"Mean of {D} = {np.mean(D):.4f}"
'Mean of [0.58 0.27 0.055 0.53 0.47 0.69 0.55 0.61 0.49 0.054] = 0.4299'
The maximum of $p(x|D)$ is at $x = 0.4330$, which is close to $0.4299$.
f"Peak at x = {X[np.argmax(Y)]:.4f}"
'Peak at x = 0.4330'
Now our $\theta$ is $\delta$. Assume the center of the likelihood (triangular) density is $\mu = 0.49$, the value that maximizes the posterior density $p(\mu|D)$.
mu_hat = mu[np.argmax(posteriors)]
answer(r"\hat{\mu}", mu_hat)
delta = np.arange(-0.3, 1.001, 0.001)
U_a = 0
U_b = D.max() - D.min()
pTheta = [prior_dist(d, U_a, U_b) for d in delta]
pTheta /= np.sum(pTheta)
fig, ax = plt.subplots()
X = delta
Y = pTheta
ax.plot(X, Y, linewidth=4)
ax.set_xlabel(r"$\theta$")
ax.set_ylabel(r"$p(\theta)$")
plt.show()
Check that the a priori density $p(\theta)$ sums to $1$.
np.sum(pTheta)
1.0
posteriors = []
for d, p_theta in zip(delta, pTheta):
p_theta_D_posterior = 1
for x in D:
p_theta_D_posterior *= likelihood_dist(x, mu_hat, d)
p_theta_D_posterior *= p_theta
posteriors.append(p_theta_D_posterior)
posteriors = np.array(posteriors) / np.sum(posteriors)
Check that the posterior density $p(\theta|D)$ sums to $1$.
np.sum(posteriors)
1.0
fig, ax = plt.subplots(figsize=(10, 6))
ax.plot(delta, posteriors, linewidth=4)
ax.set_xlabel(r"$\delta$", size=14)
ax.set_ylabel(r"$p(\theta|D) = p(\delta|D)$", size=14)
plt.show()
delta_hat = delta[np.argmax(posteriors)]
answer(r"\hat{\delta}", delta_hat)
X = np.arange(-1.5, 2.5, 0.001)
Y = []
for x in X:
p_x_D = 0
for d, p in zip(delta, posteriors):
p_x_D += likelihood_dist(x, mu_hat, d) * p
Y.append(p_x_D)
Y /= np.sum(Y)
fig, ax = plt.subplots(figsize=(10, 6))
ax.plot(X, Y, linewidth=4)
ax.set_xlabel(r"$x$", size=14)
ax.set_ylabel(r"$p(x|D)$", size=14)
plt.show()
Check that the desired class-conditional density $p(x|D)$ sums to $1$.
np.sum(Y)
0.9999999999999998
answer(r"\hat{\mu}", mu_hat)
answer(r"\hat{\delta}", delta_hat)
We can also assemble the estimated parameter vector $\hat{\mathbf{\theta}} = \begin{pmatrix} \hat{\mu} \\ \hat{\delta} \end{pmatrix}$:
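A minimal cell doing this with the helpers above (the name theta_hat is ours):
# Stack the two point estimates into a single parameter vector.
theta_hat = np.array([mu_hat, delta_hat])
answer(r"\hat{\theta}", theta_hat)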
We can compute $p(x|D)$ from $p(x|\theta)$ and $p(\theta|D)$ as given by:
$$\begin{align} p(x|D) &= \int p(x, \theta | D) \,d\theta \\ &= \int p(x | \theta, D)\, p(\theta | D) \,d\theta \\ &= \int p(x | \theta)\, p(\theta | D) \,d\theta \end{align}$$
Since the parameter vector $\vec{\theta}$ has two components, $\mu$ and $\delta$, the desired class-conditional density is:
$$ p(x|D) = \int \int p(x | \mu, \delta)\, p(\mu, \delta | D) \,d\delta \,d\mu $$
The question gives uniform priors on the parameters throughout the range of the data, so here the term $p(\vec{\theta}|D)$, i.e. $p(\mu, \delta|D)$, is treated as a constant $\alpha$. The equation then reduces to:
$$\begin{align} p(x|D) &= \int \int p(x | \mu, \delta)\, \alpha \,d\delta\,d\mu \\ &= \alpha \int \int p(x | \mu, \delta) \,d\delta\,d\mu \end{align}$$
The likelihood $p(x|\mu, \delta)$ is the triangular density; substituting its definition into $p(x|D)$ gives:
$$\begin{align} p(x|D) &= \alpha \int \int_{|x - \mu|}^{\delta_{\mathrm{max}}} \frac{\delta - |x - \mu|}{\delta^2} \,d\delta\,d\mu \\ &= \alpha \int \int_{|x - \mu|}^{\delta_{\mathrm{max}}} \left( \frac{1}{\delta} - |x - \mu|\,\delta^{-2} \right) \,d\delta\,d\mu \\ &= \alpha \int \left( \ln{\delta} + \frac{|x - \mu|}{\delta} \right) \Big|_{\delta=|x - \mu|}^{\delta_{\mathrm{max}}} \,d\mu \\ &= \alpha \int_{x_{\mathrm{min}}}^{x_{\mathrm{max}}} \left( \left[ \ln{\delta_{\mathrm{max}}} - \ln{|x - \mu|} \right] + \left[ |x - \mu| \left( \frac{1}{\delta_{\mathrm{max}}} - \frac{1}{|x - \mu|} \right) \right] \right) \,d\mu \end{align}$$
Depending on whether $\mu$ lies below or above $x$, $|x - \mu|$ equals $x - \mu$ or $\mu - x$, so the outer integral splits into two parts:
$$\begin{align} p(x|D) &= \alpha \int_{x_{\mathrm{min}}}^{x} \left( \left[ \ln{\delta_{\mathrm{max}}} - \ln{(x - \mu)} \right] + \left[ (x - \mu) \left( \frac{1}{\delta_{\mathrm{max}}} - \frac{1}{x - \mu} \right) \right] \right) \,d\mu \\ &+ \alpha \int_{x}^{x_{\mathrm{max}}} \left( \left[ \ln{\delta_{\mathrm{max}}} - \ln{(\mu - x)} \right] + \left[ (\mu - x) \left( \frac{1}{\delta_{\mathrm{max}}} - \frac{1}{\mu - x} \right) \right] \right) \,d\mu \end{align}$$
Next, solving these integrals:
$$\begin{align} p(x|D) &= \alpha \left[ \mu \left(\ln \delta_{\mathrm{max}} - 1 \right) + (x - \mu) \ln (x - \mu) - (x - \mu) - \frac{(x - \mu)^{2}}{2\delta_{\mathrm{max}}} \right]_{\mu = x_{\mathrm{min}}}^{x} \\ &+ \alpha \left[ \mu \left(\ln \delta_{\mathrm{max}} - 1 \right) - (\mu - x) \ln (\mu - x) + (\mu - x) + \frac{(\mu - x)^{2}}{2\delta_{\mathrm{max}}} \right]_{\mu = x}^{x_{\mathrm{max}}} \end{align}$$
Plugging in the integration limits and moving $\alpha$ to the other side, we get:
$$\begin{align} \frac{p(x|D)}{\alpha} &= \delta_{\mathrm{max}} \left( \ln \delta_{\mathrm{max}} - 1 \right) - (x_{\mathrm{max}} - x) \ln (x_{\mathrm{max}} - x) - (x - x_{\mathrm{min}}) \ln (x - x_{\mathrm{min}}) \\ &+ \delta_{\mathrm{max}} + \frac{(x_{\mathrm{max}} - x)^{2} + (x - x_{\mathrm{min}})^{2}}{2\delta_{\mathrm{max}}} \end{align}$$
def ln(x):
    # Natural log; np.nan_to_num turns the -inf from log(0) into a large negative finite number.
    return np.nan_to_num(np.log(x))
def desired_class_conditional_density(x, x_max, delta_max):
    # Closed-form p(x|D)/alpha derived above; x_min is taken from the enclosing scope.
    return (delta_max * (ln(delta_max) - 1)
            - (x_max - x) * ln(x_max - x)
            - (x - x_min) * ln(x - x_min)
            + delta_max
            + ((x_max - x) ** 2 + (x - x_min) ** 2) / (2 * delta_max))
x_min = D.min()
x_max = D.max()
delta_max = x_max - x_min
X = np.arange(D.min(), D.max(), 0.01)
Y = [desired_class_conditional_density(x, x_max, delta_max) for x in X]
<ipython-input-66-1e76a9e6f744>:2: RuntimeWarning: divide by zero encountered in log return np.nan_to_num(np.log(x))
fig, ax = plt.subplots(figsize=(10, 6))
ax.plot(X, Y, linewidth=4)
ax.set_xlabel(r"$x$", size=14)
ax.set_ylabel(r"$\frac{p(x|D)}{\alpha}$", size=18)
plt.show()
Since the desired class-conditional density $p(x|D)$ is only known up to the constant $\alpha$, its values do not sum to $1$.
x_hat = X[np.argmax(Y)]
answer(r"\hat{x}", x_hat)
We also find $\hat{x} = 0.3740$, the value of $x$ at which $\frac{p(x|D)}{\alpha}$ is maximal.
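As an optional cross-check of the closed form, the double integral can also be approximated by a brute-force sum of the triangular density over grids of $\mu$ and $\delta$ (the grid spacings below are our choice); the peak location should roughly agree with $\hat{x}$ above:
# Brute-force approximation of p(x|D)/alpha: sum p(x|mu, delta) over parameter grids.
mu_grid = np.arange(x_min, x_max, 0.01)
delta_grid = np.arange(0.01, delta_max, 0.01)
brute = [np.sum([likelihood_dist(x, m, d) for m in mu_grid for d in delta_grid]) for x in X]
print(f"Brute-force peak at x = {X[np.argmax(brute)]:.4f}")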