In [1]:
import math

from matplotlib import pyplot as plt
import numpy as np
import pandas as pd
from scipy.stats import norm, chi2, beta as Beta

plt.style.use("default.mplstyle")

1¶

Prove Theorem 21.5:

The risk of $\hat{f}$ is

$$R(J) = \sum_{j=1}^J \frac{\sigma_j^2}{n} + \sum_{j=J+1}^{\infty} \beta_j^2.$$

Solution:

Recall the bias-variance decomposition of the mean integrated squared error (MISE), a.k.a. the risk, into integrated variance plus integrated squared bias:

\begin{align*} R(J) &= \int \mathbb{V}(\hat{f}(x)) + \left(b(x)\right)^2 \, dx. \end{align*}

After computing the bias:

\begin{align*} b(x) &= f(x) - \mathbb{E}[\hat{f}(x)] \\ &= \sum_{j=1}^{\infty}\beta_j \phi_j(x) - \sum_{j=1}^J\mathbb{E}[\hat{\beta}_j]\phi_j(x) \\ &= \sum_{j=J+1}^{\infty}\beta_j \phi_j(x) \tag{$\hat{\beta}_j$ is unbiased}\\ \end{align*}

then the variance:

\begin{align*} \mathbb{V}[\hat{f}(x)] &= \mathbb{V}\left[ \sum_{j=1}^J \hat{\beta}_j \phi_j(x)\right] \\ &= \sum_{j=1}^J \phi_j^2(x) \mathbb{V}[\hat{\beta}_j] + \sum_{j=1}^J \sum_{k=1, k \ne j}^J \text{Cov}[\hat{\beta}_j, \hat{\beta}_k] \phi_j(x) \phi_k(x) \\ &= \sum_{j=1}^J \phi_j^2(x) \frac{\sigma_j^2}{n} + \sum_{j=1}^J \sum_{k=1, k \ne j}^J \text{Cov}[\hat{\beta}_j, \hat{\beta}_k] \phi_j(x) \phi_k(x) \\ \end{align*}

we may express the risk

\begin{align*} R(J) &= \int \left[\sum_{j=1}^J \phi_j^2(x) \frac{\sigma_j^2}{n} + \sum_{j=1}^J \sum_{k=1, k \ne j}^J \text{Cov}[\hat{\beta}_j, \hat{\beta}_k] \phi_j(x) \phi_k(x) + \sum_{j=J+1}^{\infty}\beta_j^2 \phi_j^2(x) + \sum_{j=J+1}^{\infty} \sum_{k=J+1, k\ne j}^{\infty} \beta_j \beta_{k} \phi_j(x) \phi_k(x) \right] \, dx \\ &= \sum_{j=1}^J \frac{\sigma_j^2}{n} \int \phi_j^2(x) \, dx + \sum_{j=1}^J \sum_{k=1, k \ne j}^J \text{Cov}[\hat{\beta}_j, \hat{\beta}_k] \int \phi_j(x) \phi_k(x) \, dx + \sum_{j=J+1}^{\infty} \beta_j^2 \int \phi_j^2(x) \, dx + \sum_{j=J+1}^{\infty} \sum_{k=J+1, k\ne j}^{\infty} \beta_j \beta_{k} \int \phi_j(x) \phi_k(x) \, dx \\ &= \sum_{j=1}^J \frac{\sigma_j^2}{n} + \sum_{j=J+1}^{\infty} \beta_j^2. \tag{orthonormality of basis functions} \end{align*}
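
As a quick numerical sanity check of this identity (a minimal sketch, not part of the exercise: the Beta(2, 2) density, the cosine basis, and the values of $n$, $J$, and the number of replications are arbitrary choices), we can compare a Monte Carlo estimate of the MISE against $R(J)$, using the `Beta` distribution imported above:

In [ ]:
rng = np.random.default_rng(0)

def phi(x, j):
    # cosine basis on [0, 1]
    return np.ones_like(x) if j == 0 else np.sqrt(2) * np.cos(j * np.pi * x)

grid = (np.arange(1, 200_001) - 0.5) / 200_000   # midpoint grid for the integrals
f_true = Beta.pdf(grid, 2, 2)                    # f(x) = 6x(1 - x)

n, J, n_reps = 200, 5, 500
beta_true = np.array([np.mean(f_true * phi(grid, j)) for j in range(400)])
sigma2 = np.array([np.mean(f_true * phi(grid, j) ** 2) - beta_true[j] ** 2 for j in range(J)])
theory = np.sum(sigma2) / n + np.sum(beta_true[J:] ** 2)   # R(J), tail truncated at 400 terms

mise = 0.0
for _ in range(n_reps):
    X_sim = rng.beta(2, 2, size=n)
    f_hat = sum(np.mean(phi(X_sim, j)) * phi(grid, j) for j in range(J))
    mise += np.mean((f_hat - f_true) ** 2) / n_reps
print(f"empirical MISE ~ {mise:.4f}, theoretical R(J) ~ {theory:.4f}")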

2¶

Prove Theorem 21.9:

The risk $R(J)$ of the estimator $\hat{r}_n(x) = \sum_{j=1}^J \hat{\beta}_j \phi_j(x)$ is

$$R(J) = \frac{J\sigma^2}{n} + \sum_{j=J+1}^{\infty} \beta_j^2$$

Solution: This follows along the same lines as the previous question. From the bias-variance decomposition:

\begin{align*} R(J) &= \int \mathbb{V}[\hat{r}(x)] + b(x)^2 \, dx \end{align*}

where the bias is

\begin{align*} b(x) &= r(x) - \mathbb{E}[\hat{r}(x)] \\ &= \sum_{j=1}^{\infty} \beta_j \phi_j(x) - \sum_{j=1}^J \mathbb{E}[\hat{\beta}_j]\phi_j(x) \\ &= \sum_{j=J+1}^{\infty} \beta_j \phi_j(x) \tag{$\hat{\beta}_j$ is unbiased} \end{align*}

and the variance is

\begin{align*} \mathbb{V}[\hat{r}(x)] &= \mathbb{V}\left[\sum_{j=1}^J \hat{\beta}_j \phi_j(x) \right] \\ &= \sum_{j=1}^J \mathbb{V}[\hat{\beta}_j]\phi_j^2(x) + \sum_{j=1}^J \sum_{k=1, k \ne j}^J \phi_j(x) \phi_k(x) \text{Cov}[\hat{\beta}_j, \hat{\beta}_k]. \end{align*}

Thus,

\begin{align*} R(J) &= \int \left[ \sum_{j=1}^J \mathbb{V}[\hat{\beta}_j]\phi_j^2(x) + \sum_{j=1}^J \sum_{k=1, k \ne j}^J \phi_j(x) \phi_k(x) \text{Cov}[\hat{\beta}_j, \hat{\beta}_k] + \sum_{j=J+1}^{\infty} \beta_j^2 \phi_j^2(x) + \sum_{j=J+1}^{\infty} \sum_{k=J+1, k \ne j}^{\infty} \beta_j \beta_k \phi_j(x) \phi_k(x) \right] \, dx \\ &= \sum_{j=1}^J \mathbb{V}[\hat{\beta}_j]\int \phi_j^2(x) \, dx + \sum_{j=1}^J \sum_{k=1, k \ne j}^J \text{Cov}[\hat{\beta}_j, \hat{\beta}_k] \int \phi_j(x) \phi_k(x) \, dx + \sum_{j=J+1}^{\infty} \beta_j^2 \int \phi_j^2(x) \, dx + \sum_{j=J+1}^{\infty} \sum_{k=J+1, k \ne j}^{\infty} \beta_j \beta_k \int \phi_j(x) \phi_k(x) \, dx \\ &= \frac{J\sigma^2}{n} + \sum_{j=J+1}^{\infty} \beta_j^2 \tag{orthonormality; $\mathbb{V}[\hat{\beta}_j] = \sigma^2 / n$} \end{align*}
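
The same kind of Monte Carlo check works here (a sketch; the regression function, design, noise level $\sigma$, and cutoff $J$ below are arbitrary choices, not from the text). On a regular midpoint grid the cosine basis is essentially orthonormal with respect to the empirical measure, so the empirical MISE should match $R(J)$ closely:

In [ ]:
rng = np.random.default_rng(1)

def phi(x, j):
    # cosine basis on [0, 1]
    return np.ones_like(x) if j == 0 else np.sqrt(2) * np.cos(j * np.pi * x)

n, sigma, n_reps = 1024, 0.3, 200
x_grid = (np.arange(1, n + 1) - 0.5) / n        # regularly spaced design points
r_true = phi(x_grid, 1) + 0.5 * phi(x_grid, 4)  # beta_1 = 1, beta_4 = 0.5, all others 0

J = 3                                           # keep basis functions j = 0, 1, 2
mise = 0.0
for _ in range(n_reps):
    Y_sim = r_true + sigma * rng.standard_normal(n)
    r_hat = sum(np.mean(Y_sim * phi(x_grid, j)) * phi(x_grid, j) for j in range(J))
    mise += np.mean((r_hat - r_true) ** 2) / n_reps

theory = J * sigma ** 2 / n + 0.5 ** 2          # the only excluded nonzero coefficient is beta_4
print(f"empirical MISE ~ {mise:.4f}, theoretical R(J) ~ {theory:.4f}")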

3¶

Let

$$\psi_1 = \left(\frac{1}{\sqrt{3}}, \frac{1}{\sqrt{3}}, \frac{1}{\sqrt{3}} \right), \psi_2 = \left(\frac{1}{\sqrt{2}}, -\frac{1}{\sqrt{2}}, 0 \right), \psi_3 = \left(\frac{1}{\sqrt{6}}, \frac{1}{\sqrt{6}}, -\frac{2}{\sqrt{6}} \right).$$

Show that these vectors have norm 1 and are orthogonal.

Solution:

Computing norms:

\begin{align*} ||\psi_1|| &= \left( \left(\frac{1}{\sqrt{3}} \right)^2 + \left(\frac{1}{\sqrt{3}} \right)^2 + \left(\frac{1}{\sqrt{3}} \right)^2 \right)^{1/2} = \left( \frac13 + \frac13 + \frac13 \right)^{1/2} = 1 \\ ||\psi_2|| &= \left( \left(\frac{1}{\sqrt{2}} \right)^2 + \left(-\frac{1}{\sqrt{2}} \right)^2 + 0^2 \right)^{1/2} = \left( \frac12 + \frac12 + 0\right)^{1/2} = 1 \\ ||\psi_3|| &= \left( \left(\frac{1}{\sqrt{6}} \right)^2 + \left(\frac{1}{\sqrt{6}} \right)^2 + \left(-\frac{2}{\sqrt{6}} \right)^2 \right)^{1/2} = \left( \frac16 + \frac16 + \frac23 \right)^{1/2} = 1 \\ \end{align*}

Taking inner products (noting that, by symmetry of the inner product, we need only check three such products):

\begin{align*} \langle \psi_1, \psi_2 \rangle = \frac{1}{\sqrt{3}}\frac{1}{\sqrt{2}} + \frac{1}{\sqrt{3}}\left(-\frac{1}{\sqrt{2}}\right) + \frac{1}{\sqrt{3}}(0) = 0 \\ \langle \psi_1, \psi_3 \rangle = \frac{1}{\sqrt{3}}\frac{1}{\sqrt{6}} + \frac{1}{\sqrt{3}}\frac{1}{\sqrt{6}} + \frac{1}{\sqrt{3}}\left(-\frac{2}{\sqrt{6}} \right) = 0 \\ \langle \psi_2, \psi_3 \rangle = \frac{1}{\sqrt{2}}\frac{1}{\sqrt{6}} + \left(-\frac{1}{\sqrt{2}}\right)\frac{1}{\sqrt{6}} + 0\left(-\frac{2}{\sqrt{6}} \right) = 0 \\ \end{align*}
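
A quick numerical confirmation (a small sketch using numpy): the Gram matrix of the three vectors should be the $3 \times 3$ identity.

In [ ]:
psi = np.array([np.array([1, 1, 1]) / np.sqrt(3),
                np.array([1, -1, 0]) / np.sqrt(2),
                np.array([1, 1, -2]) / np.sqrt(6)])
print(np.round(psi @ psi.T, 12))  # entry (i, j) is the inner product of psi_i and psi_j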

4¶

Prove Parseval's relation equation (21.6):

$$||f||^2 \equiv \int f^2(x) \, dx = \sum_{j=1}^{\infty} \beta_j^2 \equiv ||\beta||^2$$

Solution:

\begin{align*} \int f^2(x) \, dx &= \int \left[ \sum_{j=1}^{\infty} \beta_j^2 \phi_j^2(x) + \sum_{j=1}^{\infty}\sum_{k=1, k \ne j}^{\infty} \beta_j \beta_k \phi_j(x) \phi_k(x) \right] \, dx \\ &= \sum_{j=1}^{\infty} \beta_j^2 \int \phi_j^2(x) \, dx + \sum_{j=1}^{\infty} \sum_{k=1, k \ne j}^{\infty} \beta_j \beta_k \int \phi_j(x) \phi_k(x) \, dx \tag{$f \in L_2$, plus Fubini's theorem} \\ &= \sum_{j=1}^{\infty} \beta_j^2 \tag{orthonormality of basis functions} \end{align*}
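
As a numerical illustration (a sketch; the choice $f(x) = \sin(\pi x)$, the cosine basis on $[0, 1]$, and the truncation of the sum at 200 terms are arbitrary), the Riemann-sum value of $\int_0^1 f^2(x) \, dx = 1/2$ should match $\sum_j \beta_j^2$:

In [ ]:
N_check = 200_000
r = (np.arange(1, N_check + 1) - 0.5) / N_check      # midpoint grid on [0, 1]
f_vals = np.sin(np.pi * r)
total = 0.0
for j in range(200):
    phi_j = np.ones(N_check) if j == 0 else np.sqrt(2) * np.cos(j * np.pi * r)
    total += np.mean(f_vals * phi_j) ** 2            # beta_j^2 via a Riemann sum
print(f"integral of f^2 ~ {np.mean(f_vals ** 2):.6f}, sum of beta_j^2 ~ {total:.6f}")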

5¶

Plot the first five Legendre polynomials. Verify, numerically, that they are orthonormal.

Solution:

The first few are given in the text:

  • $P_0(x) = 1$
  • $P_1(x) = x$
  • $P_2(x) = \frac{1}{2} \left(3x^2 - 1\right)$
  • $P_3(x) = \frac{1}{2} \left(5x^3 - 3x\right)$

We compute the next polynomial, $P_4$, using the recursion relation $P_{j+1}(x) = \frac{(2j+1)xP_j(x) - jP_{j-1}(x)}{j+1}$ with $j=3$:

\begin{align*} P_4(x) &= \frac{(2 \cdot 3 + 1)xP_3(x) - 3P_2(x)}{4} \\ &= \frac{7x \left[\frac{1}{2}\left(5x^3 - 3x\right)\right] - 3\left[\frac{1}{2}\left(3x^2 - 1\right)\right]}{4} \\ &=\frac{1}{8}\left(35x^4 - 30x^2 + 3\right) \end{align*}
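
As a cross-check (a small sketch, assuming numpy's `numpy.polynomial.legendre` module is available), `leg2poly` converts Legendre-series coefficients to power-series coefficients and should reproduce the expression for $P_4$ above:

In [ ]:
from numpy.polynomial import legendre as npleg
# The Legendre series with a single unit coefficient in position 4 is P_4;
# expect power-series coefficients [3/8, 0, -30/8, 0, 35/8].
print(npleg.leg2poly([0, 0, 0, 0, 1]))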

Plotting the functions (after normalization):

In [2]:
def get_polynomial(x, coefficients):
    yy = np.zeros(len(x))
    for order, value in enumerate(coefficients):
        yy += value * np.power(x, order)
    return yy

legendre_coefficients = {"P_0": [1],
                         "P_1": [0, 1],
                         "P_2": [-1/2, 0, 3/2],
                         "P_3": [0, -3/2, 0, 5/2],
                         "P_4": [3/8, 0, -30/8, 0, 35/8]}

fig = plt.figure(figsize=(10, 6))
x = np.linspace(-1, 1, 100)
for j, (key, coefs) in enumerate(legendre_coefficients.items()):
    normalized_coefs = np.array(coefs) * math.sqrt((2 * j + 1) / 2) # normalize
    y = get_polynomial(x, normalized_coefs) 
    plt.plot(x, y, label=f"${key}(x)$")
plt.legend()
plt.show()

Verifying orthogonality numerically (the norms equal 1 by construction, thanks to the normalization applied above, so it remains to check that distinct polynomials are orthogonal):

In [3]:
N = int(1e6)
x = np.linspace(-1, 1, N + 1)
for j_a, (key_a, value_a) in enumerate(legendre_coefficients.items()):
    value_a = np.array(value_a) * math.sqrt((2 * j_a + 1) / 2) # normalization
    for j_b, (key_b, value_b) in enumerate(legendre_coefficients.items()):
        if key_b > key_a:
            value_b = np.array(value_b) * math.sqrt((2 * j_b + 1) / 2) # normalization
            y_a = get_polynomial(x, value_a)
            y_b = get_polynomial(x, value_b)
            print(f"<{key_a},{key_b}> =  {(2 / (N)) * np.sum(y_a * y_b):.3f}")
<P_0,P_1> =  -0.000
<P_0,P_2> =  0.000
<P_0,P_3> =  -0.000
<P_0,P_4> =  0.000
<P_1,P_2> =  -0.000
<P_1,P_3> =  0.000
<P_1,P_4> =  -0.000
<P_2,P_3> =  -0.000
<P_2,P_4> =  0.000
<P_3,P_4> =  -0.000

6¶

Expand the following functions in the cosine basis on [0, 1]. For (a) and (b), find the coefficients $\beta_j$ analytically. For (c) and (d), find the coefficients $\beta_j$ numerically, i.e.

$$\beta_j = \int_0^1 f(x) \phi_j(x) \, dx \approx \frac{1}{N} \sum_{r=1}^N f \left( \frac{r}{N} \right) \phi_j \left(\frac{r}{N}\right)$$

for some large integer $N$. Then plot the partial sum $\sum_{j=1}^n \beta_j \phi_j(x)$ for increasing values of $n$.

(a) $f(x) = \sqrt{2} \cos(3\pi x)$
(b) $f(x) = \sin(\pi x)$
(c) $f(x) = \sum_{j=1}^{11} h_j K(x-t_j)$ where $K(t) = (1 + \text{sign}(t))/2$, $\text{sign}(x) = -1$ if $x < 0$, $\text{sign}(x) = 0$ if $x = 0$, and $\text{sign}(x) = 1$ if $x > 0$, $$(t_j) = (.1, .13, .15, .23, .25, .40, .44, .65, .76, .78, .81),$$ $$(h_j) = (4, -5, 3, -4, 5, -4.2, 2.1, 4.3, -3.1, 2.1, -4.2).$$
(d) $f(x) = \sqrt{x(1-x)}\sin\left(\frac{2.1 \pi}{(x + 0.05)}\right)$.

Solution:

(a) Observe $f(x) = \phi_3(x)$. Thus, the coefficients are

$$ \beta_j = \begin{cases} 1 & j = 3 \\ 0 & \text{otherwise.} \\ \end{cases} $$

(b)

\begin{align*} \beta_j &= \int_a^b f(x) \phi_j(x) \, dx \\ &= \sqrt{2} \int_0^1 \sin(\pi x) \cos(j \pi x) \, dx \\ \end{align*}

Integrating by parts: \begin{align*} I = \int_0^1 \cos(j \pi x) \sin(\pi x) \, dx &= \left.\left[-\frac{\cos(j \pi x) \cos(\pi x)}{\pi}\right]\right\rvert_0^1 - j \int_0^1 \cos(\pi x) \sin(j \pi x) \, dx \\ &= \frac{\cos(j \pi) + 1}{\pi} - jI_2, \end{align*}

where $I_2 = \int_0^1 \cos(\pi x) \sin(j \pi x) \, dx$. Applying integration by parts to $I_2$, we get:

\begin{align*} I_2 = \int_0^1 \cos(\pi x) \sin(j \pi x) \, dx &= \left.\left[\frac{\sin(j \pi x) \sin(\pi x)}{\pi} \right]\right\rvert_0^1 - j \int_0^1 \cos(j \pi x) \sin(\pi x) \, dx \\ &= 0 - jI. \end{align*}

Therefore, $I = \frac{\cos(j\pi) + 1}{\pi} + j^2 I$, so $(1 - j^2)I = \frac{\cos(j\pi) + 1}{\pi}$ and, for $j \ge 2$,

$$\beta_j = \sqrt{2} \int_0^1 \cos(j \pi x) \sin(\pi x) \, dx = \frac{\sqrt{2}(\cos(j \pi) + 1)}{\pi(1-j^2)}.$$

For the remaining indices, $\beta_0 = \int_0^1 \sin(\pi x) \, dx = 2/\pi$ (recall $\phi_0 \equiv 1$) and $\beta_1 = \sqrt{2}\int_0^1 \cos(\pi x)\sin(\pi x) \, dx = 0$; these special cases are handled explicitly in `beta_function_b` below.
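
Before coding the estimators, a quick check of this closed form against the Riemann-sum approximation of $\int_0^1 \sin(\pi x) \phi_j(x) \, dx$ (a sketch; the grid size is an arbitrary choice):

In [ ]:
N_check = 100_000
r = np.arange(1, N_check + 1) / N_check
for j in range(2, 7):
    numeric = np.mean(np.sin(np.pi * r) * np.sqrt(2) * np.cos(j * np.pi * r))
    closed_form = np.sqrt(2) * (np.cos(np.pi * j) + 1) / (np.pi * (1 - j ** 2))
    print(f"j={j}: numeric = {numeric:+.6f}, closed form = {closed_form:+.6f}")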
In [4]:
def f_a(x):
    return np.sqrt(2) * np.cos(3 * np.pi * x)

def f_b(x):
    return np.sin(np.pi * x)
    
t = np.array([.1, .13, .15, .23, .25, .40, .44, .65, .76, .78, .81])
h = np.array([4, -5, 3, -4, 5, -4.2, 2.1, 4.3, -3.1, 2.1, -4.2])

def f_c(x):
    # Since sum_j h_j = 0, the constant 1/2 in K(t) = (1 + sign(t))/2 contributes nothing,
    # so only the sign(x - t_j)/2 terms are needed.
    return np.sum((np.sign(x - np.repeat(np.reshape(t, [-1, 1]), len(x), axis=1)) / 2).T * h, axis=1)

def f_d(x):
    return np.sqrt(x * (1 - x)) * np.sin(2.1 * np.pi / (x + 0.05))

def beta_function_a(j):
    return 1 if j == 3 else 0

def beta_function_b(j):
    if j == 0:
        return 2 / np.pi
    elif j == 1:
        return 0
    else:
        return (math.sqrt(2) * (np.cos(np.pi * j) + 1)) / (np.pi * (1 - j ** 2))
In [5]:
def cosine_phi(x, j):
    """cosine basis function on [0,1]"""
    if j == 0:
        return np.ones(len(x))
    else:
        return math.sqrt(2) * np.cos(j * np.pi * x)
In [6]:
class orthogonal_function_estimator():
    def __init__(self, f, phi, beta_function=None):
        self.f = f
        self.phi = phi
        self.N = 10000 # size of mesh (also reused by the plotting helpers below)
        n = 1028 # number of coefficients to compute

        self.beta = {}
        if beta_function is None:
            inputs = np.linspace(0, 1, self.N)
            for j in range(n):
                self.beta[j] = (1 / self.N) * np.sum(f(inputs) * self.phi(inputs, j))
        else:
            for j in range(n):
                self.beta[j] = beta_function(j)


    def plot_f(self):
        xx = np.linspace(0, 1, self.N)
        plt.plot(xx, self.f(xx), label="$f(x)$")

    def plot_phi(self, k):
        xx = np.linspace(0, 1, self.N)
        plt.plot(xx, self.phi(xx, k), label="$\phi_k(x)$")

    def partial_sum(self, x, J):
        y = np.zeros(len(x))
        for j in range(0, J):
            y = y + (self.beta[j] * self.phi(x, j))
        return y
    
    def plot(self):
        _, ax = plt.subplots(nrows=1, ncols=4, figsize=(20,4))
        xx = np.linspace(0, 1, self.N)
        ax[0].plot(xx, self.f(xx))
        ax[0].set_title("$f(x)$")
        y_min = min(np.array(self.f(xx))) * 1.5
        y_max = max(np.array(self.f(xx))) * 1.5
        ax[0].set_ylim(y_min, y_max)
        for index, J in enumerate([16, 64, 512]):
            ax[index + 1].plot(xx, self.partial_sum(xx, J))
            ax[index + 1].set_title("$\hat{f}$" + f"$[{J}](x)$")
            ax[index + 1].set_ylim(y_min, y_max)
        plt.show()
In [7]:
ofe = orthogonal_function_estimator(f_a, cosine_phi, beta_function_a)
ofe.plot()
In [8]:
ofe = orthogonal_function_estimator(f_b, cosine_phi, beta_function_b)
ofe.plot()
In [9]:
ofe = orthogonal_function_estimator(f_c, cosine_phi)
ofe.plot()
In [10]:
ofe = orthogonal_function_estimator(f_d, cosine_phi)
ofe.plot()

7¶

Consider the glass fragments data from the book's website. Let $Y$ be refractive index and let $X$ be aluminum content (the fourth variable).

(a) Do a nonparametric regression to fit the model $Y = f(x) + \epsilon$ using the cosine basis method. The data are not on a regular grid. Ignore this when estimating the function. (But do sort the data first according to $x$.) Provide a function estimate, an estimate of the risk, and a confidence band.

(b) Use the wavelet method to estimate $f$.

In [11]:
data = pd.read_csv("data/glass.dat", sep=r"\s+", usecols=["RI", "Al"])
Y = data["RI"].values
X = data["Al"].values
sorted_indices = X.argsort()
X = X[sorted_indices]
Y = Y[sorted_indices]
X = (X - min(X)) / (max(X) - min(X))
In [12]:
class orthogonal_function_regressor():
    
    def __init__(self, x, y, phi):
        self.x = x
        self.y = y
        self.phi = phi
        self.n = 1000
        self.beta = {}
        for j in range(self.n):
            self.beta[j] = np.mean(y * self.phi(x, j))

        self.k = int(self.n / 4)
        self.sigma_2_hat = (self.n / self.k) * np.sum(np.power(np.array([self.beta[j] for j in range(self.n-self.k+1, self.n)]), 2))

    def risk_estimate(self, J):
        R = (J * self.sigma_2_hat / self.n)
        betas = np.array([self.beta[j] for j in range(J+1, self.n)])
        terms =  np.power(betas, 2) - self.sigma_2_hat / self.n
        positive_terms = np.where(terms > 0, terms, 0)
        R += np.sum(positive_terms)
        return R

    def partial_sum(self, x, J, confidence_band=False):
        
        y = np.zeros(len(x))
        for j in range(0, J):
            y = y + (self.beta[j] * self.phi(x, j))

        if confidence_band:
            a = np.sqrt(np.sum([np.power(self.phi(x, j), 2) for j in range(J)], axis=0))
            c = (a * np.sqrt(self.sigma_2_hat) * chi2.ppf(0.05, df=J)) / np.sqrt(self.n)
            l = y - c
            u = y + c
            return y, l, u
        else:
            return y
        
ofr = orthogonal_function_regressor(X, Y, cosine_phi)

Js = np.arange(20)
plt.plot(Js, [ofr.risk_estimate(j) for j in Js], linewidth=1)
plt.xticks(Js)
plt.xlabel("$J$")
plt.ylabel("Estimated Risk")
plt.show()

xx = np.linspace(min(X), max(X), 1000)
plt.scatter(X, Y, alpha=0.25)
y, l, u = ofr.partial_sum(xx, 6, confidence_band=True)
plt.plot(xx, y, label="Orthogonal Function Regressor (J=6)")
plt.plot(xx, l, color='orange')
plt.plot(xx, u, color='orange', label="95% Confidence Band")
plt.xlabel("Aluminum Content")
plt.ylabel("Refractive Index")
plt.legend()
plt.show()

print(f"Estimated Risk: {ofr.risk_estimate(6):.3f}")
Estimated Risk: 25.075

Using the wavelet method:

In [13]:
def haar_phi(x):
    return (np.where(((0 <= x) & (x < 1)), 1, 0)).astype(np.float64)

def haar_psi(x):
    return np.where((x >= 0) & (x < 1), np.where((x < 1/2), -1, 1), 0)

def haar_psi_jk(x, j, k):
    return (2 ** (j / 2)) * haar_psi(((2 ** j) * x) - k)

n = len(X)
alpha_hat = (haar_phi(X) @ Y) / n
J = int(np.ceil(np.log2(n)))
D = {}
for j in range(J):
    for k in range(0, int(2 ** j)):
        D[j,k] = (haar_psi_jk(X, j, k) @ Y) / n

# universal thresholding
D_values = np.array([D[J - 1, k] for k in range(0, int(2 ** (J - 1)))])
sigma_hat = np.median(np.abs(D_values)) / 0.6745
for j in range(J):
    for k in range(0, int(2 ** j)):
        if np.abs(D[j,k]) <= sigma_hat * np.sqrt(2 * np.log(n) / n):
            D[j,k] = 0

x = np.linspace(0, 1, 1000)
partial_sum = alpha_hat * haar_phi(x)
for j in range(J):
    for k in range(0, int(2 ** j)):
        partial_sum += D[j,k] * haar_psi_jk(x, j, k)

plt.scatter(X,Y, alpha=0.5)
plt.plot(x, partial_sum)
plt.show()

8¶

Show that the Haar wavelets are orthonormal.

Solution:

The Haar scaling function is defined:

$$ \phi(x) = \begin{cases} 1 & \text{if} \,\, 0 \le x < 1 \\ 0 & \text{otherwise,} \\ \end{cases} $$

the mother Haar wavelet is defined:

$$ \psi(x) = \begin{cases} -1 & \text{if} \,\, 0 \le x \le \frac12 \\ 1 & \text{if} \,\, \frac12 < x \le 1 \\ 0 & \text{otherwise,} \end{cases} $$

and finally, for any integers $j$ and $k$, we define the daughter wavelet:

$$ \psi_{jk}(x) = 2 ^ {j / 2} \psi(2^j x - k).$$

We first establish normality:

\begin{align*} ||\phi(x)||^2 &= \int \phi^2(x) \, dx = \int_0^1 \, dx = 1 \end{align*}

\begin{align*} ||\psi(x)||^2 &= \int_{0}^{1/2} (-1)^2 \, dx + \int_{1/2}^1 1^2 \, dx = 1 \end{align*}

\begin{align*} ||\psi_{jk}(x)||^2 &= \int_{2^{-j}k}^{(k + 1/2)2^{-j}} \left(-2^{j/2}\right)^2 \, dx + \int_{(k + 1/2)2^{-j}}^{(k + 1)2^{-j}} \left(2^{j/2}\right)^2 \, dx = 2^j \cdot 2^{-j-1} + 2^j \cdot 2^{-j-1} = 1. \end{align*}

Orthogonality can be established by the following observations. If $(j_1, k_1) \ne (j_2, k_2)$, then either the supports of $\psi_{j_1k_1}$ and $\psi_{j_2k_2}$ are disjoint, or the support of one is contained in one of the two halves of the support of the other. In the first case, the pointwise product of the functions is zero, and hence so is the inner product. Suppose the second case holds and, WLOG, that $\text{supp}(\psi_{j_1k_1})$ is contained in one half of $\text{supp}(\psi_{j_2k_2})$. Then $\psi_{j_2k_2}$ is constant on $\text{supp}(\psi_{j_1k_1})$ (equal to $-2^{j_2/2}$ or $2^{j_2/2}$, depending on whether that half is the left or the right one), so the pointwise product is a constant multiple of $\psi_{j_1k_1}$, which integrates to 0. The same argument gives $\langle \phi, \psi_{jk} \rangle = 0$ for every $j \ge 0$ and $0 \le k \le 2^j - 1$, since $\phi \equiv 1$ on the support of each such $\psi_{jk}$.
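
The argument can also be spot-checked numerically with the Haar functions defined in the solution to question 7 above (a sketch; it approximates the inner products of a few wavelets on $[0, 1]$ with a midpoint Riemann sum, so the off-diagonal entries should be 0 and the diagonal entries 1):

In [ ]:
z = (np.arange(1, 100_001) - 0.5) / 100_000
wavelets = {"phi": haar_phi(z), "psi_00": haar_psi_jk(z, 0, 0),
            "psi_10": haar_psi_jk(z, 1, 0), "psi_11": haar_psi_jk(z, 1, 1)}
for name_a, w_a in wavelets.items():
    print("  ".join(f"<{name_a},{name_b}> = {np.mean(w_a * w_b):+.3f}"
                    for name_b, w_b in wavelets.items()))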

9¶

Consider again the doppler signal:

$$f(x) = \sqrt{x(1 - x)} \sin \left( \frac{2.1\pi}{x + 0.05}\right).$$

Let $n = 1,024$, $\sigma = 0.1$, and let $(x_1, \dots, x_n) = (1 / n, \dots, 1)$. Generate data

$$Y_i = f(x_i) + \sigma \epsilon_i$$

where $\epsilon_i \sim N(0, 1)$.

(a) Fit the curve using the cosine basis method. Plot the function estimate and confidence band for $J = 10, 20, \dots, 100$.

(b) Use Haar wavelets to fit the curve.

In [14]:
N = 1_024
sigma = 0.1
x = np.arange(1, N + 1) / N  # the grid (1/n, 2/n, ..., 1), built to avoid floating-point end-point issues
eps = norm.rvs(size=N)
Y = f_d(x) + sigma * eps
In [15]:
# fitting using cosine basis method

def cosine_phi(x, j):
    if j == 0:
        return np.ones(len(x))
    else:
        return math.sqrt(2) * np.cos(j * np.pi * x)
    
ofr = orthogonal_function_regressor(x, Y, cosine_phi)
Js = np.arange(10, 110, 10)
fig, ax = plt.subplots(nrows=2, ncols=5, figsize=(22,8))
ax = ax.flatten()
for index, J in enumerate(Js):
    xx = np.linspace(0, 1, 1000)
    y_est, lb, ub = ofr.partial_sum(xx, J=J, confidence_band=True)
    ax[index].plot(xx, y_est, color='blue')
    ax[index].plot(xx, lb, color='orange')
    ax[index].plot(xx, ub, color='orange')
    ax[index].set_ylim(-1, 1)
    ax[index].set_title(f"J={J}")
    ax[index].grid(False)
    ax[index].set_yticks([])
In [16]:
# computing the coefficients using the DWT for Haar Wavelets
n = len(Y)
J = int(np.ceil(np.log2(n)))
D = {x: None for x in range(J)}
temp = Y / np.sqrt(n)
for j in range(J - 1, -1, -1):
    m = 2 ** j
    I = np.array(list(range(1, m + 1))).astype(int)
    D[j] = ((temp[2 * I - 1] - temp[np.array(2 * I) - 2]) / np.sqrt(2))
    temp = (temp[2 * I - 1] + temp[np.array(2 * I) - 2]) / np.sqrt(2)

# applying universal thresholding
D_values = np.array([D[J-1][k] for k in range(0, int(2 ** (J-1)))])
sigma_hat = np.sqrt(n) * np.median(np.abs(D_values)) / 0.6745
for j in range(J):
    for k in range(0, int(((2 ** (j))))):
        if np.abs(D[j][k]) <= sigma_hat * np.sqrt(2 * np.log(n) / n):
            D[j][k] = 0

# computing the approximation
xx = np.linspace(0, 1, 1_000)
alpha_hat = (haar_phi(x) @ Y) / n
partial_sum = alpha_hat * haar_phi(xx)
for j in range(J):
    for k in range(0, int(2 ** j)):
        partial_sum = partial_sum + D[j][k] * haar_psi_jk(xx, j, k)

plt.scatter(x, Y, alpha=0.03)
plt.plot(xx, partial_sum)
Out[16]:
[<matplotlib.lines.Line2D at 0x7f0bc7e433d0>]

10¶

(Haar density Estimation.) Let $X_1, \dots, X_n \sim f$ for some density $f$ on $[0, 1]$. Let's consider constructing a wavelet histogram. Let $\phi$ and $\psi$ be the Haar father and mother wavelet. Write

$$f(x) \approx \phi(x) + \sum_{j=0}^{J-1}\sum_{k=0}^{2^j - 1} \beta_{j,k} \psi_{j,k}(x)$$

where $J \approx \log_2(n)$. Let

$$\hat{\beta}_{jk} = \frac{1}{n} \sum_{i=1}^n \psi_{j,k}(X_i).$$

(a) Show that $\hat{\beta}_{j,k}$ is an unbiased estimate of $\beta_{j,k}$.

(b) Define the Haar histogram

$$\hat{f}(x) = \phi(x) + \sum_{j=1}^B \sum_{k=0}^{2^j - 1} \hat{\beta}_{j,k} \psi_{j,k}(x)$$

for $0 \le B \le J-1$.

(c) Find an approximate expression for the MSE as a function of $B$.

(d) Generate $n=1,000$ observations from a $\text{Beta}(15,4)$ density. Estimate the density using the Haar histogram. Use leave-one-out cross validation to choose $B$.

Solution:

Establishing unbiasedness. Note: we must assume $f \in L^2[0,1]$, so that the Haar expansion of $f$ is valid. This holds if, e.g., $f$ is bounded on $[0, 1]$; in particular, it holds if $f$ is continuous on $[0, 1]$.

\begin{align*} \mathbb{E}[\hat{\beta}_{jk}] &= \frac{1}{n} \sum_{i=1}^n \mathbb{E}[\psi_{jk}(X_i)] \\ &= \mathbb{E}[\psi_{jk}(X_1)] \\ &= \int_0^1 \psi_{jk}(x) f(x) \, dx = \beta_{jk} \tag{Requires $f \in L^2[0,1]$} \end{align*}
\begin{align*} \mathbb{V}[\hat{\beta}_{jk}] &= \frac{1}{n^2} \sum_{i=1}^n \mathbb{V}[\psi_{jk}(X_i)] \\ &= \frac{1}{n} \mathbb{V}[\psi_{jk}(X_1)] \\ &= \frac{1}{n} \int_0^1 (\psi_{jk}(x) - \beta_{jk})^2 f(x) \, dx \\ &= \frac{\sigma^2_{jk}}{n} \end{align*}

Finding an expression for the Mean Squared Error:

\begin{align*} \mathbb{E}[(\hat{f}(x) - f(x))^2] &= \mathbb{V}[\hat{f}(x) - f(x)] + \left(\mathbb{E}[\hat{f}(x) - f(x)]\right)^2 \\ &= \mathbb{V}[\hat{f}(x)] + \left(f(x) - \mathbb{E}[\hat{f}(x)]\right)^2 \end{align*}

The bias term is

\begin{align*} f(x) - \mathbb{E}[\hat{f}(x)] &= \left[\phi(x) + \sum_{j=0}^{J-1}\sum_{k=0}^{2^j - 1} \beta_{j,k} \psi_{j,k}(x) \right] - \left[\phi(x) + \sum_{j=0}^B \sum_{k=0}^{2^j - 1} \mathbb{E}[\hat{\beta}_{j,k}] \psi_{j,k}(x)\right] \\ &= \sum_{j=B+1}^{J-1}\sum_{k=0}^{2^j - 1} \beta_{j,k} \psi_{j,k}(x) \tag{$\hat{\beta}_{j,k}$ is unbiased} \end{align*}

and the variance is

\begin{align*} \mathbb{V}[\hat{f}(x)] &= \mathbb{V} \left[\phi(x) + \sum_{j=0}^{B}\sum_{k=0}^{2^j - 1} \hat{\beta}_{j,k} \psi_{j,k}(x) \right] \\ &= \sum_{j=0}^{B}\sum_{k=0}^{2^j - 1} \frac{\sigma^2_{jk}}{n}\psi_{j,k}^2(x) + \sum_{j=0}^{B}\sum_{k=0}^{2^j - 1} \sum_{(j',k') \ne (j,k)} \text{Cov}[\hat{\beta}_{j,k}, \hat{\beta}_{j', k'}] \psi_{jk}(x) \psi_{j'k'}(x), \end{align*}

where the inner sum runs over $0 \le j' \le B$ and $0 \le k' \le 2^{j'} - 1$ with $(j', k') \ne (j, k)$.

When integrating the variance plus the squared bias over $[0, 1]$, all of the cross-terms vanish by orthonormality of the Haar basis, and we get:

\begin{align*} \text{MISE} = \sum_{j=B+1}^{J-1}\sum_{k=0}^{2^j - 1} \beta^2_{j,k} + \sum_{j=0}^{B}\sum_{k=0}^{2^j - 1} \frac{\sigma^2_{jk}}{n} \end{align*}
In [17]:
def haar_histogram(X, B):

    def compute_beta(x):
        beta = {}
        for j in range(B + 1):
            for k in range(2 ** j):
                beta[j,k] = np.sum(haar_psi_jk(x, j, k)) / n
        return beta
    
    beta = compute_beta(X)

    def f_hat(z):
        f_hat = haar_phi(z).astype(np.float64)
        for j in range(B + 1):
            for k in range(2 ** j):
                f_hat += beta[j,k] * haar_psi_jk(z, j, k)
        return f_hat
        
    return f_hat

n = 1_000
J = np.round(np.log2(n)).astype(int)
X = Beta.rvs(a=15, b=4, size=n)
f_hat = haar_histogram(X, 4)

step = 1e-4
xx = np.arange(0, 1 + step, step)
plt.plot(xx, f_hat(xx))
plt.show()
In [18]:
def risk_of_haar_histogram(X, B):
    f_hat = haar_histogram(X, B)
    xx = np.arange(0, 1 + step, step)
    second_moment = np.sum((f_hat(xx) ** 2) * step)
    return second_moment - (2 / n) * np.sum([haar_histogram(np.delete(X, i), B)(X[i]) for i in range(n)])

risk = {}
for B in range(J+1):
    risk[B] = risk_of_haar_histogram(X, B)
In [19]:
plt.plot(list(risk.keys()), list(risk.values()))
plt.xlabel("$B$")
plt.ylabel("$\hat{J}$", rotation=0)
plt.title("Risk of Haar Histogram by $B$")

print(f"Risk minimizer: B={np.argmin(list(risk.values()))}")
Risk minimizer: B=4
In [20]:
plt.figure(figsize=(20, 8))
for index, B in enumerate(range(J)):
    f_hat = haar_histogram(X, B)
    ax = plt.subplot(2, 5, index + 1)
    ax.plot(xx, f_hat(xx))
    ax.grid(False)
    ax.set_title(f"$B = {B}$, estimated risk $= {risk[B]:.3f}$")
plt.show()

11¶

In this question, we will explore the motivation for equation (21.37). Let $X_1, \dots, X_n \sim N(0, \sigma^2)$. Let

$$\hat{\sigma} = \sqrt{n} \times \frac{\text{median}(|X_1|, \dots, |X_n|)}{0.6745}.$$

(a) Show that $\mathbb{E}[\hat{\sigma}] = \sigma$.

(b) Simulate $n = 100$ observations from a $N(0,1)$ distribution. Compute $\hat{\sigma}$ as well as the usual estimate of $\sigma$. Repeat 1,000 times and compare the MSE.

(c) Repeat (b) but add some outliers to the data. To do this, simulate each observation from a $N(0, 1)$ with probability 0.95 and simulate each observation from a $N(0, 10)$ with probability 0.05.

Solution:

Note: the equation as stated appears to contain a typo; for i.i.d. observations we should not scale by $\sqrt{n}$ (presumably the $\sqrt{n}$ in equation (21.37) is there because the empirical wavelet coefficients it is applied to have standard deviation of order $\sigma/\sqrt{n}$). The estimate should be

$$\hat{\sigma} = \frac{\text{median}(|X_1|, \dots, |X_n|)}{0.6745}.$$

Fact: the sample median is a consistent, asymptotically unbiased estimator of the population median. That is, if $Y_1, \dots, Y_n \sim f$, then $\mathbb{E}[\text{median}(Y_1, \dots, Y_n)] \to F_{Y_1}^{-1}(1/2)$ as $n \to \infty$ (exact unbiasedness holds only in special cases, e.g. when $f$ is symmetric about its median). Therefore, at least approximately,

$$\mathbb{E}[\hat{\sigma}] \approx \frac{F_{|X|}^{-1}(1/2)}{0.6745}$$

where $X \sim N(0, \sigma^2)$. The result then follows by observing that $|X|$ follows a half-normal distribution with parameter $\sigma$, which has median

$$F_{|X|}^{-1}(1/2) = \sigma \sqrt{2} \text{erf}^{-1}(1/2) \approx 0.6745 \sigma.$$
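
Both the constant and the (approximate) unbiasedness can be checked numerically (a sketch; the values $\sigma = 2$, $n = 100$, and the number of replications are arbitrary choices):

In [ ]:
print(f"Phi^(-1)(3/4) = {norm.ppf(0.75):.6f}")   # the constant 0.6745...

sigma_true = 2.0
samples = norm.rvs(scale=sigma_true, size=(100, 50_000))   # n = 100 per replication
sigma_hat_sim = np.median(np.abs(samples), axis=0) / 0.6745
print(f"mean of sigma_hat over replications: {np.mean(sigma_hat_sim):.4f} (sigma = {sigma_true})")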

The median-based estimate improves on the MSE of the usual sample-variance estimate

$$\hat{\sigma}^2_{\text{old}} = \frac{1}{n-1}\sum_{i=1}^n (X_i - \bar{X})^2.$$

(Since $\sigma = 1$ in the simulation below, $\sigma^2 = \sigma$, so both estimators target the same value and their MSEs are directly comparable.)
In [21]:
n = 100
k = 1000
X = norm.rvs(size=(n, k))

sigma_hat_old = np.sum(np.power(X - np.mean(X, axis=0), 2), axis=0) / (n - 1)
sigma_hat_new = np.median(np.abs(X), axis=0) / 0.6745

mse_old = np.mean(np.power(sigma_hat_old - 1, 2))
mse_new = np.mean(np.power(sigma_hat_new - 1, 2))

print(f"MSE of old estimate: {mse_old:.4f}")
print(f"MSE of new estimate: {mse_new:.4f}")
MSE of old estimate: 0.0195
MSE of new estimate: 0.0132

The second experiment demonstrates the new estimate is much more robust to outliers:

In [22]:
rand_ints = np.random.randint(0, 100, size=(n, k))
mask_5_percent = rand_ints < 5
normal_1 = norm.rvs(0, 1, size=(n, k))
normal_10 = norm.rvs(0, 10, size=(n, k))
X = np.where(mask_5_percent, normal_10, normal_1)

sigma_hat_old = np.sum(np.power(X - np.mean(X, axis=0), 2), axis=0) / (n - 1)
sigma_hat_new = np.median(np.abs(X), axis=0) / 0.6745

mse_old = np.mean(np.power(sigma_hat_old - 1, 2))
mse_new = np.mean(np.power(sigma_hat_new - 1, 2))

print(f"MSE of old estimate: {mse_old:.4f}")
print(f"MSE of new estimate: {mse_new:.4f}")
MSE of old estimate: 41.2768
MSE of new estimate: 0.0183

12¶

Repeat question 6 using the Haar basis.

Solution:

(a)

The coefficient of a basis function is computed by taking the inner product of the basis function and the function of interest:

\begin{align*} \alpha = \int_0^1 f(x) \phi(x) \, dx, \qquad \beta_{jk} = \int_0^1 f(x) \psi_{jk}(x) \, dx. \end{align*}

For $f(x) = \sqrt{2}\cos(3\pi x)$:

\begin{align*} \alpha &= \sqrt{2} \int_0^1 \cos(3 \pi x) \, dx = \frac{\sqrt{2}}{3 \pi} \sin(3 \pi) = 0 \end{align*}

\begin{align*} \beta_{jk} &= \sqrt{2} \cdot 2^{j/2} \left[ -\int_{2^{-j}k}^{2^{-j}(k + 1/2)} \cos(3 \pi x) \, dx + \int_{2^{-j}(k + 1/2)}^{2^{-j}(k + 1)} \cos(3 \pi x) \, dx \right]\\ &= \frac{2^{(j + 1)/2}}{3 \pi}\left[\sin(3 \pi (k + 1) 2^{-j}) - 2\sin(3 \pi (k + 1/2) 2^{-j}) + \sin(3 \pi k 2^{-j}) \right] \end{align*}
In [23]:
def beta_function_a(j, k):
    first_term = np.sin(3 * np.pi * (k + 1) * 2 ** (-j))
    second_term = - 2 * np.sin(3 * np.pi * (k + 0.5) * 2 ** (-j))
    third_term = np.sin(3 * np.pi * (k) * 2 ** (-j))
    return (2 ** ((j + 1) / 2)/ (3 * np.pi)) * (first_term + second_term + third_term)
    
def wavelet_regressor(f, father_wavelet, daughter_wavelet, alpha=None, beta_function=None):
    beta = {}
    J = 6
    z = np.arange(0, 1, 1e-4)
    Y = f(z)
    if beta_function is None:
        alpha = (Y @ father_wavelet(z)) / len(Y)

    for j in range(J + 1):
        for k in range(2 ** j):
            if beta_function is None:
                beta[j,k] = (Y @ daughter_wavelet(z, j, k)) / len(Y)
            else:
                beta[j, k] = beta_function(j, k)
    
    def f_hat(x):
        result = alpha * father_wavelet(x)
        for j in range(J + 1):
            for k in range(2 ** j):
                result += beta[j, k] * daughter_wavelet(x, j, k)
        return result
    return f_hat

f_hat = wavelet_regressor(f_a, haar_phi, haar_psi_jk, alpha=0, beta_function=beta_function_a)
xx = np.arange(0, 1, 1e-4)
plt.plot(xx, f_hat(xx))
Out[23]:
[<matplotlib.lines.Line2D at 0x7f0bc7e5ad60>]

(b)

\begin{align*} \alpha = \int_0^1 \sin(\pi x) \, dx = \left.-\frac{\cos(\pi x)}{\pi}\right\rvert_0^1 = \frac{2}{\pi} \end{align*}

\begin{align*} \beta_{jk} &= 2^{j/2} \left[-\int_{2^{-j}k}^{2^{-j}(k + 1/2)} \sin(\pi x) \, dx + \int_{2^{-j}(k + 1/2)}^{2^{-j}(k + 1)} \sin(\pi x) \, dx \right]\\ &= 2^{j/2} \left[ \left. \frac{\cos(\pi x)}{\pi} \right\rvert_{2^{-j}k}^{2^{-j}(k + 1/2)} - \left. \frac{\cos(\pi x)}{\pi} \right\rvert_{2^{-j}(k + 1/2)}^{2^{-j}(k + 1)} \right] \\ &= \frac{2^{j/2}}{\pi}\left[ 2\cos \left(\frac{(k + 1/2) \pi}{2^{j}}\right) - \cos \left(\frac{k \pi}{2^{j}}\right) - \cos \left(\frac{(k + 1) \pi}{2^{j}}\right)\right] \end{align*}
In [24]:
def beta_function_b(j,k):
    return ((2 ** (j / 2)) / np.pi) \
        * (2 * np.cos(((k + (1/2)) * np.pi)/(2 ** j)) \
        - np.cos(k * np.pi / (2 ** j)) - np.cos(((k + 1) * np.pi)/(2 ** j)))

f_hat = wavelet_regressor(f_b, haar_phi, haar_psi_jk, alpha = (2 / np.pi), beta_function=beta_function_b)

xx = np.arange(0, 1, 1e-4)
plt.plot(xx, f_hat(xx))
Out[24]:
[<matplotlib.lines.Line2D at 0x7f0bcc24ab50>]
In [25]:
f_hat = wavelet_regressor(f_c, haar_phi, haar_psi_jk)
xx = np.arange(0, 1, 1e-4)
plt.plot(xx, f_hat(xx))
Out[25]:
[<matplotlib.lines.Line2D at 0x7f0bcdf23610>]
In [26]:
f_hat = wavelet_regressor(f_d, haar_phi, haar_psi_jk)
xx = np.arange(0, 1, 1e-4)
plt.plot(xx, f_hat(xx))
Out[26]:
[<matplotlib.lines.Line2D at 0x7f0bd05ff970>]