In [1]:
import numpy as np
from scipy.stats import beta as Beta, binom, norm, rv_continuous
from scipy.special import gamma
from matplotlib import pyplot as plt
from tqdm.notebook import tqdm
np.random.seed(42)

1¶

Verify 11.7:

Let $X_1, \dots, X_n \sim N(\theta, \sigma^2)$. For simplicity, let us assume that $\sigma$ is known. Let us take as a prior $\theta \sim N(a, b^2)$. Show the posterior for $\theta$ is

$$\theta \mid X^n \sim N(\bar{\theta}, \tau^2)$$

where

$$\bar{\theta} = w\bar{X} + (1-w)a, \qquad w = \frac{\frac{1}{\text{se}^2}}{\frac{1}{\text{se}^2} + \frac{1}{b^2}}, \qquad \frac{1}{\tau^2} = \frac{1}{\text{se}^2} + \frac{1}{b^2},$$

and $\text{se} = \sigma / \sqrt{n}$ is the standard error of the MLE $\bar{X}$.

Solution:

Note that it suffices to show the posterior pdf is proportional to $\exp \left(-\frac{1}{2} \left(\frac{\theta - \bar{\theta}}{\tau}\right) ^ 2 \right)$. Ignoring constant factors will be a common theme in this chapter. Letting $\mathcal{L}(\theta \mid X^n)$ and $f(\theta)$ denote the likelihood and prior, respectively, we have

\begin{align*} f(\theta \mid X^n) &\propto \mathcal{L}(\theta \mid X^n) f(\theta) \\ &\propto \exp \left( -\frac{1}{2\sigma^2} \sum_i (X_i - \theta)^2 \right) \cdot \exp \left( -\frac{1}{2b^2}(\theta - a)^2 \right) \\ &= \exp \left( -\frac{1}{2} \left[ \frac{\sum_i (X_i - \theta)^2}{\sigma^2} + \frac{(\theta - a)^2}{b^2} \right] \right) \end{align*}

Now note that it suffices to show the contents of the square brackets are equal to $\left(\frac{\theta - \bar{\theta}}{\tau}\right) ^ 2 + C$ for some $C$ that doesn't depend on $\theta$. Note that $\sum_i (X_i - \theta)^2 = n(\bar{X} - \theta)^2 + nS^2$, where $S^2 = n^{-1}\sum_i (X_i - \bar{X})^2$ (shown by adding $(-\bar{X} + \bar{X})$ and expanding the square). Also note that $\frac{1}{\text{se}^2} = \frac{w}{\tau^2}$, and $\frac{1}{b^2} = \frac{1-w}{\tau^2}$.

\begin{align*} \frac{\sum_i (X_i - \theta)^2}{\sigma^2} + \frac{(\theta - a)^2}{b^2} &= \frac{n(\theta - \bar{X})^2 + nS^2}{\sigma^2} + \frac{(\theta - a)^2}{b^2} \\ &= \frac{(\theta - \bar{X})^2}{\text{se}^2} + \frac{(\theta - a)^2}{b^2} + \frac{S^2}{\text{se}^2} \\ &= \frac{\theta^2 - 2\bar{X}\theta + \bar{X}^2}{\text{se}^2} + \frac{\theta^2 - 2a\theta + a^2}{b^2} + C' \tag{$C' = \frac{S^2}{\text{se}^2}$} \\ &= \left(\frac{1}{\text{se}^2} + \frac{1}{b^2} \right)\theta^2 - 2\left(\frac{\bar{X}}{\text{se}^2} + \frac{a}{b^2}\right)\theta + \left(\frac{\bar{X}^2}{\text{se}^2} + \frac{a^2}{b^2} \right) + C'\\ &= \frac{1}{\tau^2} \theta^2 - 2 \left(\frac{w}{\tau^2}\bar{X} + \frac{1-w}{\tau^2} a\right)\theta + \left(\frac{w}{\tau^2}\bar{X}^2 + \frac{1-w}{\tau^2} a^2 \right) +C' \\ &= \frac{1}{\tau^2} \left[\theta^2 - 2 \bar{\theta}\theta + \bar{\theta}^2\right] + \frac{1}{\tau^2}\left[w\bar{X}^2 + (1-w)a^2 - \bar{\theta}^2\right] +C' \\ &= \frac{(\theta - \bar{\theta})^2}{\tau^2} + C \tag{$C = \frac{w\bar{X}^2 + (1-w)a^2 - \bar{\theta}^2}{\tau^2} + C'$} \end{align*}
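Though not required by the proof, a quick numerical sanity check (with arbitrary illustrative values of $n$, $\sigma$, $a$, and $b$) compares the closed-form $N(\bar{\theta}, \tau^2)$ density against a brute-force evaluation of likelihood times prior on a grid:

In [ ]:
# Quick numerical sanity check of the N(theta_bar, tau^2) posterior
# (illustrative values; not part of the proof).
n_chk, sigma_chk, a_chk, b_chk = 25, 2.0, 0.0, 3.0
X_chk = norm.rvs(loc=1.5, scale=sigma_chk, size=n_chk)

se2 = sigma_chk ** 2 / n_chk
w = (1 / se2) / (1 / se2 + 1 / b_chk ** 2)
tau2 = 1 / (1 / se2 + 1 / b_chk ** 2)
theta_bar = w * X_chk.mean() + (1 - w) * a_chk

# Brute-force posterior on a grid: exp(log-likelihood + log-prior), then normalize.
grid = np.linspace(theta_bar - 5 * np.sqrt(tau2), theta_bar + 5 * np.sqrt(tau2), 2001)
log_post = (-0.5 * ((X_chk[:, None] - grid) ** 2).sum(axis=0) / sigma_chk ** 2
            - 0.5 * (grid - a_chk) ** 2 / b_chk ** 2)
post = np.exp(log_post - log_post.max())
post /= post.sum() * (grid[1] - grid[0])  # normalize numerically

print("max abs difference from closed form:",
      np.max(np.abs(post - norm.pdf(grid, loc=theta_bar, scale=np.sqrt(tau2)))))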

2¶

Let $X_1, \dots, X_n \sim \text{Normal}(\mu, 1)$.

(a) Simulate a data set (using $\mu = 5$) consisting of $n=100$ observations.

In [2]:
mu = 5
n = 100
X = norm.rvs(loc=mu, scale=1, size=n)

(b) Take $f(\mu) = 1$ and find the posterior density. Plot the density.

The posterior density is given by: \begin{align*} f(\mu \mid X^n) &\propto \mathcal{L}_n(\mu \mid X^n) f(\mu) \\ &= (2 \pi)^{-n/2} \exp \left( (-1/2) \sum_i (X_i - \mu)^2 \right) \\ &= (2 \pi)^{-n/2} \exp \left( (-n/2)[(\bar{X} - \mu)^2 + S^2 ]\right) \\ &\propto \exp \left[-\frac12 \left(\frac{\bar{X} - \mu}{1 / \sqrt{n}} \right)^2 \right] \\ &\propto \sqrt{\frac{n}{2\pi}} \exp \left[-\frac12 \left(\frac{\bar{X} - \mu}{1 / \sqrt{n}} \right)^2 \right] \tag{Normalized} \end{align*}

Thus, $\mu \mid X^n \sim N(\bar{X},1/ n)$.

In [3]:
X_bar = np.mean(X)
sigma = np.sqrt(1/n)
XX = np.arange(4, 6, .01)
plt.plot(XX, norm.pdf(XX, loc=X_bar, scale=sigma))
plt.title("Posterior Density for $\mu$")
plt.grid()
plt.show()

(c) Simulate 1000 draws from the posterior. Plot a histogram of the simulated values and compare the histogram to the answers in (b).

In [4]:
k = 1000
mu_post = norm.rvs(loc=X_bar, scale=sigma, size=k)
plt.plot(XX, norm.pdf(XX, loc=X_bar, scale=np.sqrt(1/n)), label='Posterior Density')
plt.hist(mu_post, bins=30, histtype='step', density=True, label='(Normalized) Histogram of Draws')
plt.grid()
plt.legend(loc='upper right')
plt.show()

(d) Let $\theta = e^\mu$. Find the posterior density for $\theta$ analytically and by simulation.

The posterior cdf is given by: \begin{align*} H(\theta | X^n) &= P(e^\mu \le \theta | X^n) \\ &= \int_{\{\mu : e^\mu \le \theta\}} f(\mu \mid X^n) \, d\mu \\ &= \int_{-\infty}^{\log(\theta)} f(\mu \mid X^n) \, d\mu \\ &= \Phi \left( \frac{\log(\theta) - \bar{X}}{\sqrt{1/n}}\right) \end{align*} Meaning the posterior pdf is:

\begin{align*} H'(\theta | X^n) = \phi \left( \frac{\log(\theta) - \bar{X}}{\sqrt{1/n}}\right)\frac{1}{\theta \sqrt{1/n}} \end{align*}
In [5]:
TT = np.arange(100, 200, .1)
theta_pdf = norm.pdf((np.log(TT) - X_bar) / np.sqrt(1/n)) * (1 / (TT * np.sqrt(1/n)))  # analytic posterior pdf
plt.plot(TT, theta_pdf, label='Posterior Density')
theta_post = np.exp(mu_post)  # posterior draws of theta, transformed from the draws of mu
plt.hist(theta_post, bins=30, histtype='step', density=True, label='(Normalized) Histogram of Draws')
plt.grid()
plt.legend()
plt.show()

(e) Find a 95% posterior interval for $\mu$.

As $\mu \mid X^n \sim N(\bar{X}, 1/n)$, a 95% posterior interval is given by $(\bar{X} - n^{-1/2}z_{0.025},\, \bar{X} + n^{-1/2}z_{0.025})$.

In [6]:
alpha = 0.05
z = norm.ppf(1 - alpha/2)
print(f"{100 *(1-alpha):.0f}% C.I. for mu: ({X_bar - (1/np.sqrt(n)) * z:.3f}, {X_bar + (1/np.sqrt(n)) * z:.3f})")
95% C.I. for mu: (4.700, 5.092)

(f) Find a 95% posterior interval for $\theta$.

We can transform the interval for $\mu$, yielding $(\exp(\bar{X} - n^{-1/2}z_{0.025}),\exp(\bar{X} + n^{-1/2}z_{0.025}))$:

In [7]:
print(f"{100 *(1-alpha):.0f}% C.I. for theta: " \
      f"({np.exp(X_bar - (1/np.sqrt(n)) * z):.3f}," \
      f" {np.exp(X_bar + (1/np.sqrt(n)) * z):.3f})")
95% C.I. for theta: (109.964, 162.739)

or we can get it from our simulation:

In [8]:
print(f"{100 *(1-alpha):.0f}% C.I. for theta: " \
      f"({np.quantile(theta_post, 0.025):.3f}," \
      f" {np.quantile(theta_post, 0.975):.3f})")
95% C.I. for theta: (111.968, 164.394)

3¶

Let $X_1, \dots, X_n \sim \text{Uniform}(0, \theta)$. Let $f(\theta) \propto 1/\theta$. Find the posterior density.

Solution:

Let $X_{\max} = \max\{X_1, \dots, X_n\}$. Recalling $$\mathcal{L}_n(\theta \mid X^n) = \begin{cases} 0 & \theta \le X_{\max} \\ \frac{1}{\theta^n} & X_{\max} < \theta, \end{cases} $$

we have

\begin{align*} f(\theta \mid X^n) &\propto \mathcal{L}_n(\theta \mid X^n) f(\theta) \\ &= \begin{cases} 0 & \theta \le X_{\max}\\ \frac{1}{\theta^{n+1}} & X_{\max} < \theta \end{cases} \\ &= \mathbb{1}_{X_{\max} < \theta} \cdot \theta^{-(n+1)}. \end{align*}

Normalizing (the normalizing constant is $\int_{X_{\max}}^{\infty} \theta^{-(n+1)} \, d\theta = \frac{1}{n X_{\max}^n}$), we get

$$f(\theta \mid X^n) = \mathbb{1}_{X_{\max} < \theta} \cdot n (X_{\max})^n \, \theta^{-(n+1)} $$
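A brief check on simulated data (the values of $\theta$ and $n$ below are illustrative) confirms that this density integrates to one and concentrates just above $X_{\max}$:

In [ ]:
# Sanity check of the Uniform(0, theta) posterior on simulated data (illustrative values).
theta_true, n_u = 3.0, 20
X_u = np.random.uniform(0, theta_true, size=n_u)
x_max = X_u.max()

grid = np.linspace(x_max, 3 * x_max, 5000)
posterior = n_u * x_max ** n_u / grid ** (n_u + 1)  # n * X_max^n * theta^{-(n+1)}

# The tail beyond 3 * X_max contributes (1/3)^n, negligible for n = 20.
print("approximate integral:", posterior.sum() * (grid[1] - grid[0]))
plt.plot(grid, posterior)
plt.axvline(x_max, linestyle='--', color='black', label=r'$X_{\max}$')
plt.title(r"Posterior Density for $\theta$")
plt.legend()
plt.grid()
plt.show()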

4¶

Suppose that 50 people are given a placebo and 50 are given a new treatment. 30 placebo patients show improvement while 40 treated patients show improvement. Let $\tau = p_2 − p_1$ where $p_2$ is the probability of improving under treatment and $p_1$ is the probability of improving under placebo.

(a) Find the MLE of $\tau$. Find the standard error and 90 percent confidence interval using the delta method.

Let $\mathbf{p} = [p_1, p_2]^T$, and let $g(\mathbf{p}) = p_2 - p_1$. Note that the likelihood of $\mathbf{p}$ can be expressed as the product of two independent likelihoods:

\begin{align*} \mathcal{L}_n(p_1,p_2) &= {50 \choose 30}p_1^{30}(1-p_1)^{20} \cdot {50 \choose 40}p_2^{40}(1-p_2)^{10} \\ &= \mathcal{L}_n(p_1) \cdot \mathcal{L}_n(p_2) \end{align*}

Hence $\max \mathcal{L}_n(p_1,p_2) = \max \mathcal{L}_n(p_1) \cdot \max \mathcal{L}_n(p_2)$.

Maximizing the individual likelihoods:

$\ell(p_1) = 30\log(p_1) + 20\log(1-p_1)$

$\ell'(p_1) = \frac{30}{p_1} - \frac{20}{1-p_1} = 0 \Rightarrow 30(1-\hat{p}_1) = 20\hat{p}_1 \Rightarrow \hat{p}_1 = \frac{3}{5}$

Similarly, $\hat{p}_2 = \frac{4}{5}$, and so $\hat{\mathbf{p}} = [\hat{p}_1, \hat{p}_2]^T$. By the invariance property of the MLE, $\hat{\tau} = g(\hat{\mathbf{p}}) = \hat{p}_2 - \hat{p}_1 = \frac{1}{5}$.

We now seek the standard error. We have the gradient of $g$:

$\nabla g = \begin{bmatrix} -1 \\ 1 \end{bmatrix}$

the Fisher Information matrix (the negated expected value of the Hessian of the log likelihood):

$I_n = \begin{bmatrix} \frac{50}{p_1(1-p_1)} & 0 \\ 0 & \frac{50}{p_2(1-p_2)} \end{bmatrix}$

and its inverse:

$J_n = I_n^{-1} = \begin{bmatrix} \frac{p_1(1-p_1)}{50} & 0 \\ 0 & \frac{p_2(1-p_2)}{50} \end{bmatrix}.$

By Theorem 9.28, we have

$\hat{\text{se}}(\hat{\tau}) = \sqrt{(\hat{\nabla}g)^T \hat{J}_n \hat{\nabla}g} = \sqrt{\frac{\hat{p}_1(1-\hat{p}_1)}{50} + \frac{\hat{p}_2(1-\hat{p}_2)}{50}} = \frac{\sqrt{5}}{25} \approx 0.0894$

where $\hat{\nabla}g = \nabla g(\hat{\mathbf{p}})$ ($=\nabla g$, in our case), and $\hat{J}_n = J_n(\hat{\mathbf{p}})$.

Thus, a 90 percent confidence interval is given by:

$(\frac{1}{5} - z_{.05}\frac{\sqrt{5}}{25}, \frac{1}{5} + z_{0.05}\frac{\sqrt{5}}{25}) \approx (0.0529, 0.3471)$
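The same numbers can be computed in code; the gradient and the estimated covariance $\hat{J}_n$ below are hard-coded from the expressions above:

In [ ]:
# Delta-method standard error and 90% confidence interval for tau = p2 - p1.
p_1_hat, p_2_hat = 30 / 50, 40 / 50
tau_hat = p_2_hat - p_1_hat

grad_g = np.array([-1.0, 1.0])
J_hat = np.diag([p_1_hat * (1 - p_1_hat) / 50, p_2_hat * (1 - p_2_hat) / 50])
se_hat = np.sqrt(grad_g @ J_hat @ grad_g)

z = norm.ppf(1 - 0.05)  # 90% interval: 5% in each tail
print(f"MLE: {tau_hat:.3f}, standard error: {se_hat:.4f}")
print(f"90% C.I.: ({tau_hat - z * se_hat:.4f}, {tau_hat + z * se_hat:.4f})")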

(b) Find the standard error and 90 percent confidence interval using the parametric bootstrap.

In [9]:
B = 100000
p_1_hat = 3 / 5
p_2_hat = 4 / 5
tau_hat = p_2_hat - p_1_hat
tau_boot = np.empty(B)
for i in range(B):
    p_1_boot = binom.rvs(n=50, p=p_1_hat) / 50
    p_2_boot = binom.rvs(n=50, p=p_2_hat) / 50
    tau_boot[i] = p_2_boot - p_1_boot
se_boot = np.std(tau_boot)
z = norm.ppf(1-0.05)
print(f"Standard error: {se_boot:.3f}")
print(f"90% C.I.: ({tau_hat - z * se_boot:.3f},{tau_hat + z * se_boot:.3f})")
Standard error: 0.089
90% C.I.: (0.053,0.347)

(c) Use the prior $f(p_1, p_2) = 1$. Use simulation to find the posterior mean and posterior 90 percent interval for $\tau$.

We have the posterior:

\begin{align*} f(\mathbf{p} \mid X) &\propto \mathcal{L}(\mathbf{p})f(\mathbf{p}) \\ &\propto p_1^{30}(1-p_1)^{20}p_2^{40}(1-p_2)^{10} \\ &= p_1^{(30 + 1) - 1} (1-p_1)^{(20 + 1)-1}p_2^{(40 + 1) - 1} (1-p_2)^{(10 + 1)-1}, \end{align*}

which is the kernel of a product of two independent Beta densities.

Thus we can sample $p_1$ from $\text{Beta}(31, 21)$ and $p_2$ from $\text{Beta}(41, 11)$.

In [10]:
k = 100000
p_1_samples = Beta.rvs(a=31, b=21, size=k)
p_2_samples = Beta.rvs(a=41, b=11, size=k)
tau_samples = p_2_samples - p_1_samples
In [11]:
print(f"Simulated posterior mean: {np.mean(tau_samples):.3f}")
print(f"90% C.I.: " \
      f"({np.quantile(tau_samples, 0.05):.3f}," \
      f" {np.quantile(tau_samples, 0.95):.3f})")
Simulated posterior mean: 0.193
90% C.I.: (0.047, 0.336)

(d) Let $$\psi = \log \left( \left(\frac{p_1}{1-p_1}\right) \div \left(\frac{p_2}{1-p_2}\right) \right)$$

be the log-odds ratio. Note that $\psi = 0$ if $p_1 = p_2$. Find the MLE of $\psi$. Use the delta method to find a 90 percent confidence interval for $\psi$.

By the equivariance of the MLE, the MLE of $\psi$ is simply

$$\hat{\psi} = \log \left( \left(\frac{\hat{p}_1}{1-\hat{p}_1}\right) \div \left(\frac{\hat{p}_2}{1-\hat{p}_2}\right) \right) \approx -0.981$$

We now compute the standard error using the delta method: $$\hat{\text{se}}(\hat{\psi}) = \sqrt{(\hat{\nabla}g)^T \hat{J}_n \hat{\nabla}g}$$ where $\hat{J}_n$ is as in part (a) and now $$g(p_1, p_2) = \log \left( \left(\frac{p_1}{1-p_1}\right) \div \left(\frac{p_2}{1-p_2}\right) \right),$$ meaning $$\nabla g = \begin{bmatrix} \frac{1}{p_1(1-p_1)} \\ -\frac{1}{p_2(1-p_2)}\end{bmatrix}.$$

Thus, \begin{align*} \hat{\text{se}}(\hat{\psi}) &= \sqrt{\frac{1}{50\hat{p}_1(1-\hat{p}_1)} + \frac{1}{50\hat{p}_2(1-\hat{p}_2)}} \\ &= \frac{\sqrt{30}}{12} \approx 0.456 \end{align*}

In [12]:
psi_hat = np.log((p_1_hat / (1 - p_1_hat)) / (p_2_hat / (1 - p_2_hat)))
z = norm.ppf(1-0.05)
print(f"90% C.I.: ({psi_hat - z * np.sqrt(30)/12:.3f}, {psi_hat + z * np.sqrt(30)/12:.3f})")
90% C.I.: (-1.732, -0.230)

(e) Use simulation to find the posterior mean and posterior 90 percent interval for $\psi$.

In [13]:
psi_samples = np.log((p_1_samples / (1 - p_1_samples)) / (p_2_samples / (1 - p_2_samples)))
print(f"Posterior mean: {np.mean(psi_samples):.3f}")
print(f"90% C.I.: ({np.quantile(psi_samples, 0.05):.3f}, "
      f"{np.quantile(psi_samples, 0.95):.3f})")
Posterior mean: -0.954
90% C.I.: (-1.705, -0.226)

5¶

Consider the $\text{Bernoulli}(p)$ observations $$ 0\,1\,0\,1\,0\,0\,0\,0\,0\,0 $$ Plot the posterior for $p$ using these priors: $\text{Beta}(1/2,1/2)$, $\text{Beta}(1,1)$, $\text{Beta}(10,10)$, $\text{Beta}(100,100)$.

Solution:

Recall a random variable has a $\text{Beta}$ distribution with parameters $\alpha$ and $\beta$ if its density is $$ f(p; \alpha, \beta) = \frac{\Gamma(\alpha + \beta)}{\Gamma(\alpha)\Gamma(\beta)} p^{\alpha - 1}(1-p)^{\beta - 1}$$

Since

$\mathcal{L}_n(p \mid X) = \prod_i p^{X_i} (1-p)^{1-X_i} = p^2(1-p)^8$,

\begin{align*} f(p \mid X) &\propto \mathcal{L}_n(p \mid X) f(p) \\ &\propto p^{\alpha + 1}(1-p)^{\beta + 7} \\ &= p^{(\alpha + 2) - 1}(1-p)^{(\beta + 8)-1} \\ &\propto \frac{\Gamma(\alpha + \beta + 10)}{\Gamma(\alpha + 2)\Gamma(\beta + 8)} p^{(\alpha + 2) - 1}(1-p)^{(\beta + 8)-1}. \\ \end{align*}

That is, $p \mid X \sim \text{Beta}(\alpha + 2, \beta + 8)$.

In [14]:
p_hat = 2 / 10
alphas = [.5, 1, 10, 100]
betas = [.5, 1, 10, 100]
X = np.arange(0, 1, 0.01)
fig, (ax1, ax2) = plt.subplots(nrows=1, ncols=2, figsize=(12, 6))
for alpha, beta in zip(alphas, betas):
    ax1.plot(X, Beta.pdf(X, alpha, beta))
    ax2.plot(X, Beta.pdf(X, alpha + 2, beta + 8), label=f"a={alpha}, b={beta}")
ax1.set_title("Prior Distributions")
ax2.set_title("Posterior Distributions")
ax2.vlines(p_hat, 0, 12, linestyle='--', color='black', label='MLE')
ax1.grid(True)
ax2.grid(True)
ax2.legend()
plt.show()

6¶

Let $X_1, \dots, X_n \sim \text{Poisson}(\lambda)$.

(a) Let $\lambda \sim \text{Gamma}(\alpha, \beta)$ be the prior. Show that the posterior is also a Gamma. Find the posterior mean.

$\mathcal{L}_n(\lambda) = \prod_i e^{-\lambda}\frac{\lambda^{X_i}}{X_i!} = \frac{1}{\prod_i X_i!} e^{-n\lambda}\lambda^{(\sum_i X_i)}$

\begin{align*} f(\lambda \mid X) &\propto \mathcal{L}_n(\lambda)f(\lambda) \\ &=\frac{1}{\prod_i X_i!} e^{-n\lambda}\lambda^{(\sum_i X_i)} \frac{1}{\beta^{\alpha} \Gamma(\alpha)} \lambda^{\alpha - 1} e^{-\lambda / \beta} \\ &= \frac{1}{\beta^{\alpha} \Gamma(\alpha) \prod_i X_i!} \lambda^{(\alpha + \sum_i X_i) - 1} e^{-\lambda (n + \frac{1}{\beta})} \\ &\propto \lambda^{\alpha' - 1} e^{-\lambda/\beta'} \end{align*}

where $\alpha' = \alpha + \sum_i X_i$ and $\beta' = \frac{\beta}{n\beta + 1}$. Thus, $\lambda \mid X \sim \text{Gamma}(\alpha + \sum_i X_i, \frac{\beta}{n\beta + 1})$. The posterior mean is thus the mean of this distribution:

$$E(\lambda \mid X) = \frac{\beta(\alpha + \sum_i X_i)}{n\beta + 1}$$
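As a quick numerical check of the conjugate update (the values of $\alpha$, $\beta$, $\lambda$, and $n$ below are illustrative), we can compare the closed-form $\text{Gamma}(\alpha', \beta')$ posterior with a brute-force grid computation:

In [ ]:
from scipy.stats import poisson, gamma as Gamma

# Illustrative check that Gamma(alpha', beta') matches a brute-force grid posterior.
alpha_0, beta_0, lam_true, n_p = 2.0, 1.5, 4.0, 30
X_p = poisson.rvs(mu=lam_true, size=n_p)

alpha_post = alpha_0 + X_p.sum()
beta_post = beta_0 / (n_p * beta_0 + 1)
print(f"Posterior mean (closed form): {alpha_post * beta_post:.3f}")

# Grid posterior: exp(log-likelihood + log-prior), normalized numerically.
grid = np.linspace(0.01, 10, 2000)
log_post = (-n_p * grid + X_p.sum() * np.log(grid)           # Poisson log-likelihood (up to const.)
            + (alpha_0 - 1) * np.log(grid) - grid / beta_0)   # Gamma(alpha_0, beta_0) log-prior (up to const.)
post = np.exp(log_post - log_post.max())
post /= post.sum() * (grid[1] - grid[0])
print(f"Posterior mean (grid): {(grid * post).sum() * (grid[1] - grid[0]):.3f}")
print(f"Max density difference: "
      f"{np.max(np.abs(post - Gamma.pdf(grid, a=alpha_post, scale=beta_post))):.2e}")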

(b) Find the Jeffreys' prior. Find the posterior.

Computing the Jeffreys' prior: \begin{align*} f(x;\lambda) &= e^{-\lambda} \frac{\lambda^x}{x!} \\ \Rightarrow \log f(x;\lambda) &= -\lambda + x\log(\lambda) - \log(x!) \\ \Rightarrow s(x, \lambda) = \frac{\partial}{\partial \lambda} \log f(x;\lambda) &= -1 + \frac{x}{\lambda} \\ \Rightarrow \frac{\partial s(x, \lambda)}{\partial \lambda} &= -\frac{x}{\lambda^2} \\ \Rightarrow I(\lambda) = -\mathbb{E}_{\lambda}\left(\frac{\partial s(x, \lambda)}{\partial \lambda}\right) &= \frac{1}{\lambda} \\ \Rightarrow f(\lambda) \propto \sqrt{I(\lambda)} &= \sqrt{1 / \lambda} \\ \end{align*}

Thus, the Jeffreys' prior is $f(\lambda) \propto \sqrt{1 / \lambda}$, an improper prior.

Computing the posterior:

\begin{align*} f(\lambda \mid X) &\propto \mathcal{L}_n(\lambda)f(\lambda) \\ &=\frac{1}{\prod_i X_i!} e^{-n\lambda}\lambda^{(\sum_i X_i)} \lambda^{-1/2} \\ &=\frac{1}{\prod_i X_i!} e^{-n\lambda}\lambda^{(\sum_i X_i) - 1/2} \\ &\propto \lambda^{\alpha' - 1} e^{-\lambda/\beta'} \end{align*}

where $\alpha' = (\sum_i X_i) + 1/2$ and $\beta' = 1/n$. Hence $\lambda \mid X \sim \text{Gamma}\left(\sum_i X_i + \frac12, \frac{1}{n}\right)$.
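To visualize this, the sketch below plots the Jeffreys'-prior posterior next to the conjugate posterior from the check in part (a) (it reuses `X_p`, `n_p`, `alpha_post`, `beta_post`, and `Gamma` from that cell):

In [ ]:
# Compare the Jeffreys'-prior posterior Gamma(sum(X) + 1/2, 1/n) with the conjugate one.
grid = np.linspace(2.5, 6, 1000)
plt.plot(grid, Gamma.pdf(grid, a=X_p.sum() + 0.5, scale=1 / n_p), label="Jeffreys' prior posterior")
plt.plot(grid, Gamma.pdf(grid, a=alpha_post, scale=beta_post), linestyle='--',
         label='Gamma(2, 1.5)-prior posterior')
plt.axvline(X_p.mean(), color='black', linestyle=':', label=r'MLE $\bar{X}$')
plt.legend()
plt.grid()
plt.show()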

7¶

In Example 11.9, verify 11.11.

See Example 11.9 for definitions.

We seek to show the Horvitz-Thompson estimator:

$$\hat{\psi} = \frac{1}{n} \sum_{i=1}^n \frac{R_iY_i}{\xi_{X_i}}$$

is unbiased with variance not exceeding $\frac{1}{n\delta^2}$.

Solution: Since the triples $(X_i, R_i, Y_i)$ are i.i.d., $\mathbb{E}\left[ \frac{R_iY_i}{\xi_{X_i}} \right]$ is the same for every $i$. Conditioning on $X_i$, we may establish that $\hat{\psi}$ is unbiased: \begin{align*} \mathbb{E}(\hat{\psi}) &= \frac{1}{n} \sum_{j=1}^n \mathbb{E}\left[ \frac{R_jY_j}{\xi_{X_j}} \right] \\ &= \mathbb{E}\left[ \frac{R_iY_i}{\xi_{X_i}} \right] \\ &= \mathbb{E}\left[\mathbb{E}\left[ \frac{R_iY_i}{\xi_{X_i}} \,\middle|\, X_i\right]\right] \tag{Iterated expectation} \\ &= \mathbb{E}\left[\frac{1}{\xi_{X_i}}\,\mathbb{E}\left[R_iY_i \mid X_i\right]\right] \\ &= \mathbb{E}\left[\frac{1}{\xi_{X_i}}\,\xi_{X_i}\theta_{X_i}\right] \tag{$R_i \perp Y_i \mid X_i$} \\ &= \mathbb{E}\left[\theta_{X_i}\right] = P(Y_i = 1) = \psi. \end{align*}

Similarly noting that $\mathbb{V}\left[ \frac{R_iY_i}{\xi_{X_i}} \right] = \mathbb{V}\left[ \frac{R_jY_j}{\xi_{X_j}} \right]$ for all $i,j \in \{1,\dots, n\}$, we may bound the variance:

\begin{align*} \mathbb{V}(\hat{\psi}) &= \mathbb{V} \left[\frac{1}{n} \sum_{i=1}^n \frac{R_iY_i}{\xi_{X_i}} \right] \\ &= \frac{1}{n^2} \sum_{i=1}^n \mathbb{V} \left[ \frac{R_iY_i}{\xi_{X_i}} \right] \tag{Independence} \\ &= \frac{1}{n} \mathbb{V} \left[ \frac{R_iY_i}{\xi_{X_i}} \right] \tag{Identically distributed} \\ &= \frac{1}{n} \left[\mathbb{E}\left[ \left(\frac{R_iY_i}{\xi_{X_i}} \right)^2\right] - \psi^2\right] \\ &\le \frac{1}{n} \mathbb{E}\left[ \frac{R_i^2Y_i^2}{\xi_{X_i}^2}\right] \tag{$\psi^2 \ge 0$} \\ &\le \frac{1}{n\delta^2} \mathbb{E} [R_i^2Y_i^2] \tag{$\xi_{X_i} \ge \delta$}\\ &\le \frac{1}{n\delta^2} \tag{$R_iY_i \le 1$} \end{align*}
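As an illustration (not part of the verification), here is a small Monte Carlo sketch under an assumed concrete version of the Example 11.9 setup: $X_i$ uniform on $\{0, 1\}$; given $X_i = x$, $R_i \sim \text{Bernoulli}(\xi_x)$ and $Y_i \sim \text{Bernoulli}(\theta_x)$ independently; $\xi$ known with $\xi_x \ge \delta$. The parameter values are made up.

In [ ]:
# Monte Carlo check that the Horvitz-Thompson estimator is unbiased and that
# its variance respects the 1/(n * delta^2) bound (illustrative, assumed setup).
xi = np.array([0.4, 0.9])       # known response probabilities, so delta = 0.4
theta = np.array([0.3, 0.7])    # P(Y = 1 | X = x)
n_ht, n_sims = 50, 20000
psi_true = theta.mean()         # X uniform on {0, 1}

psi_hat_sims = np.empty(n_sims)
for s in range(n_sims):
    X_ht = np.random.randint(0, 2, size=n_ht)
    R = np.random.binomial(1, xi[X_ht])
    Y = np.random.binomial(1, theta[X_ht])
    psi_hat_sims[s] = np.mean(R * Y / xi[X_ht])

print(f"psi = {psi_true:.3f}, mean of estimates = {psi_hat_sims.mean():.3f}")
print(f"variance of estimates = {psi_hat_sims.var():.5f}, "
      f"bound 1/(n delta^2) = {1 / (n_ht * 0.4 ** 2):.5f}")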

8¶

Let $X \sim N(\mu, 1)$. Consider testing

$$H_0 : \mu = 0 \text{ versus } H_1 : \mu \ne 0$$

Take $P(H_0) = P(H_1) = \frac12$. Let the prior for $\mu$ under $H_1$ be $\mu \sim N(0, b^2)$. Find an expression for $P(H_0 \mid X = x)$. Compare $P(H_0 \mid X = x)$ to the $p$-value of the Wald test. Do the comparison numerically for a variety of values of $x$ and $b$. Now repeat the problem using a sample of size $n$. You will see that the posterior probability of $H_0$ can be large even when the $p$-value is small, especially when $n$ is large. This disagreement between Bayesian and frequentist testing is called the Jeffreys-Lindley paradox.

Solution:

The MLE is $\bar{X}$, with standard error $\sigma / \sqrt{n} = n^{-1/2}$ (since $\sigma = 1$). So the Wald statistic is $W = \sqrt{n}\bar{X}$, with $p$-value $2 \Phi(-|W|)$.

We have

\begin{align*} P(H_0 \mid X^n) &= \frac{f(X^n \mid H_0) P(H_0)}{f(X^n \mid H_0) P(H_0) + f(X^n \mid H_1) P(H_1)} \\ &= \frac{f(X^n \mid H_0)}{f(X^n \mid H_0) + f(X^n \mid H_1)} \\ &= \frac{f(X^n \mid \mu = 0)}{f(X^n \mid \mu = 0) + \int f(X^n \mid \mu) f(\mu) \, d\mu} \\ &= \frac{1}{1 + \gamma} \end{align*}

where

$$\gamma = \frac{\int f(X^n \mid \mu) f(\mu) \, d\mu}{f(X^n \mid \mu = 0)}.$$

The integrand is:

\begin{align*} f(X^n \mid \mu) f(\mu) &= (2 \pi)^{-n/2} \exp \left\{ -\frac12 \sum_i (X_i - \mu)^2 \right\} (2 \pi b^2)^{-1/2} \exp \left\{ -\frac12 (\mu / b)^2 \right\} \\ &= \frac{1}{b} (2 \pi)^{-(n+1)/2} \exp \left\{ -\frac12 \left[\sum_i (X_i - \mu)^2 + (\mu / b)^2 \right] \right\}. \end{align*}

Letting

$$\sigma^2 = \frac{b^2}{1 + nb^2},$$

we can expand and complete the square:

\begin{align*} \sum_i (X_i - \mu)^2 + (\mu / b)^2 &= \frac{1}{b^2} \mu^2 + \sum_i [X_i^2 - 2X_i\mu + \mu^2] \\ &= \left(\frac{1}{b^2} + n\right)\mu^2 - 2n\bar{X}\mu + \sum_i X_i^2 \\ &= \frac{1}{\sigma^2}\mu^2 - 2n\bar{X}\mu + \sum_i X_i^2 \\ &= \frac{1}{\sigma^2}\left(\mu^2 - 2n\sigma^2\bar{X}\mu\right) + \sum_i X_i^2 \\ &= \frac{1}{\sigma^2}\left(\mu - n\sigma^2\bar{X}\right)^2 + \sum_i X_i^2 - (n\sigma\bar{X})^2. \\ \end{align*}

Thus, we can express the integrand as the product of a constant and a density:

\begin{align*} f(X^n \mid \mu) f(\mu) &= \frac{1}{b}(2 \pi)^{-(n+1)/2} \exp \left\{ -\frac{\left(\mu - n\sigma^2\bar{X}\right)^2}{2\sigma^2} \right\} \exp \left\{ -\frac12 \left[ \sum_i X_i^2 - (n\sigma\bar{X})^2 \right] \right\} \\ &= \frac{\sigma}{b}(2 \pi)^{-n/2}\exp \left\{ -\frac12 \left[\sum_i X_i^2 - (n\sigma\bar{X})^2 \right] \right\} \cdot (2 \pi \sigma^2)^{-1/2} \exp \left\{ -\frac{\left(\mu - n\sigma^2\bar{X}\right)^2}{2\sigma^2} \right\}. \end{align*}

Integrating over $\mu$, the second factor (a Normal density in $\mu$) integrates to one, leaving:

$$\int f(X^n \mid \mu) f(\mu) \, d\mu = \frac{\sigma}{b}(2 \pi)^{-n/2}\exp \left\{ -\frac12 \left[\sum_i X_i^2 - (n\sigma\bar{X})^2 \right] \right\}$$

Meanwhile,

\begin{align*} f(X^n \mid \mu = 0) &= (2\pi)^{-n/2} \exp\left\{-\frac{1}{2} \sum_i X_i^2 \right\} \end{align*}

Thus,

$$ \gamma = \frac{\int f(X^n \mid \mu) f(\mu) \, d\mu}{f(X^n \mid \mu = 0)} = \frac{\sigma}{b} \exp \left\{ (n\sigma\bar{X})^2 / 2 \right\},$$

and

\begin{align*} P(H_0 \mid X^n) &= \frac{1}{1 + \frac{\sigma}{b} \exp \left\{(n\sigma\bar{X})^2 / 2 \right\}} \end{align*}
In [15]:
for n in [10, 100, 1000]:
    X = norm.rvs(loc=0.1, scale=1, size=n)
    X_bar = X.mean()
    p_value = 2 * norm.cdf(-np.sqrt(n) * np.abs(X_bar))
    
    print(f"n = {n}, p-value: {p_value:.3f}")
    b = np.logspace(-4, 5, num=50, base=10)
    
    sigma_2 = b ** 2 / (1 + n * (b ** 2))
    z = (np.sqrt(sigma_2) / b) * np.exp(( np.sqrt(sigma_2) * n * X_bar) ** 2 / 2)
    posterior = 1 / (1 + z)

    plt.plot(b, posterior, label=f"n={n}")
    plt.xscale('log')
    plt.xlabel('b')
    plt.ylabel("Posterior Probability of $H_0$")
plt.legend()
plt.grid()
plt.show()
n = 10, p-value: 0.008
n = 100, p-value: 0.193
n = 1000, p-value: 0.000