import math
import numpy as np
import pandas as pd
from numpy.random import default_rng
rng = default_rng(42)
import matplotlib as mpl
import plotly.graph_objects as go
from matplotlib import pyplot as plt
from scipy.stats import binom, chi2, norm
from tqdm.notebook import tqdm
mpl.rcParams["font.size"] = 18
Prove Theorem 10.6
Suppose the true value of $\theta$ is $\theta_* \ne \theta_0$. The power $\beta(\theta_*)$, the probability of correctly rejecting the null hypothesis, is given (approximately) by
$$1 - \Phi \left( \frac{\theta_0 - \theta_*}{\hat{se}} + z_{\alpha / 2} \right) + \Phi \left( \frac{\theta_0 - \theta_*}{\hat{se}} - z_{\alpha / 2} \right)$$Solution:
Observe $z_{\alpha / 2} \ge 0$. We have
\begin{align*} \beta(\theta_*) &= P_{\theta_*}(|W| > z_{\alpha / 2}) \\ &= P_{\theta_*}(W > z_{\alpha / 2}) + P_{\theta_*}(W < -z_{\alpha / 2}) \\ &= P_{\theta_*} \left( \frac{\hat{\theta} - \theta_0}{\hat{se}} > z_{\alpha / 2} \right) + P_{\theta_*}\left(\frac{\hat{\theta} - \theta_0}{\hat{se}} < -z_{\alpha / 2}\right) \\ &= P_{\theta_*} \left( \frac{\hat{\theta} - \theta_*}{\hat{se}} + \frac{\theta_* - \theta_0}{\hat{se}} > z_{\alpha / 2} \right) + P_{\theta_*}\left(\frac{\hat{\theta} - \theta_*}{\hat{se}} + \frac{\theta_* - \theta_0}{\hat{se}} < -z_{\alpha / 2}\right) \\ &= P_{\theta_*} \left( \frac{\hat{\theta} - \theta_*}{\hat{se}} > \frac{\theta_0 - \theta_*}{\hat{se}} + z_{\alpha / 2}\right) + P_{\theta_*}\left(\frac{\hat{\theta} - \theta_*}{\hat{se}} < \frac{\theta_0 - \theta_*}{\hat{se}} -z_{\alpha / 2} \right) \\ &\rightarrow P \left( Z > \frac{\theta_0 - \theta_*}{\hat{se}} + z_{\alpha / 2}\right) + P\left(Z < \frac{\theta_0 - \theta_*}{\hat{se}} - z_{\alpha / 2}\right) \\ &= 1 - \Phi\left( \frac{\theta_0 - \theta_*}{\hat{se}} + z_{\alpha / 2} \right) + \Phi \left( \frac{\theta_0 - \theta_*}{\hat{se}} - z_{\alpha / 2} \right) \end{align*}Prove Theorem 10.14:
If the test statistic has a continuous distribution, then under $H_0 : \theta = \theta_0$, the p-value has a Uniform (0,1) distribution. Therefore, if we reject $H_0$ when the p-value is less than $\alpha$, the probability of a Type I error is $\alpha$.
Solution:
Let $a \in (0,1)$. We have
\begin{align*} P(\text{p-value} \le a) &\approx P(2\Phi(-|w|) \le a) \tag{Theorem 10.13} \\ &= P\left(|w| \ge -\Phi ^{-1} \left(\frac{a}{2}\right)\right) \\ &= P\left(w \ge -\Phi ^{-1}\left(\frac{a}{2}\right)\right) + P\left(w \le \Phi^{-1} \left(\frac{a}{2}\right)\right) \\ &= \frac{a}{2} + \frac{a}{2} = a. \tag{$w \sim N(0,1)$} \end{align*}Since the p-value is a probability, it can only assume values in $[0,1]$. Therefore, if $a \le 0$, $P(\text{p-value} \le a) = 0$, and if $a \ge 1$, $P(\text{p-value} \le a) = 1$. Thus, the p-value has a uniform $(0,1)$ distribution.
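As a quick numerical illustration (not part of the proof), the following sketch simulates Wald-test p-values for a Normal mean under $H_0$ and checks that their distribution looks Uniform(0,1); the sample size and number of replications are arbitrary choices.
n_sim, reps, theta_0 = 50, 10000, 0.0
samples = rng.normal(loc=theta_0, scale=1.0, size=(reps, n_sim))
theta_hats = samples.mean(axis=1)
se_hats = samples.std(axis=1, ddof=1) / np.sqrt(n_sim)
w_stats = (theta_hats - theta_0) / se_hats
p_values = 2 * norm.cdf(-np.abs(w_stats))
# Under H_0, P(p-value <= a) should be close to a for every a in (0, 1).
for a in [0.05, 0.25, 0.5, 0.75]:
    print(f"P(p-value <= {a}): {np.mean(p_values <= a):.3f}")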
Prove Theorem 10.10.
The size $\alpha$ Wald test rejects $H_0 : \theta = \theta_0$ versus $H_1 : \theta \ne \theta_0$ if and only if $\theta_0 \notin C$ where
$$C = (\hat{\theta} - \hat{se} z_{\alpha / 2}, \hat{\theta} + \hat{se} z_{\alpha / 2}).$$Thus, testing the hypothesis is equivalent to checking whether the null value is in the confidence interval.
Solution:
The size $\alpha$ Wald test rejects $H_0$ exactly when $|W| \ge z_{\alpha / 2}$. We have the chain of equivalences
\begin{align*} &|W| \ge z_{\alpha / 2} \\ &\iff \left|\frac{\hat{\theta} - \theta_0}{\hat{se}} \right| \ge z_{\alpha / 2} \\ &\iff \left|\hat{\theta} - \theta_0 \right| \ge \hat{se}z_{\alpha / 2} \tag{$\hat{se} \ge 0$}\\ &\iff \theta_0 \notin C \end{align*}Prove Theorem 10.12:
Suppose that the size $\alpha$ test is of the form
$$\text{reject } H_0 \text{ if and only if } T(X^n) \ge c_{\alpha}.$$Then,
$$\text{p-value} = \sup_{\theta \in \Theta_0} P_{\theta}(T(X^n) \ge T(x^n))$$where $x^n$ is the observed value of $X^n$. If $\Theta_0 = \{\theta_0\}$ then
$$\text{p-value } = P_{\theta_0}(T(X^n) \ge T(x^n)).$$Solution:
From the definitions of p-value and $\alpha$, we have
$$\text{p-value} = \inf_{\alpha} \left\{ \sup_{\theta \in \Theta_0} P_{\theta}(T(X^n) \ge c_{\alpha}) \mid T(x^n) \ge c_{\alpha}\right\}.$$We may observe that $\sup_{\theta \in \Theta_0} P_{\theta}(T(X^n) \ge c_{\alpha})$ decreases as $c_{\alpha}$ increases, and, assuming there is an $\alpha$ for which $c_{\alpha} = T(x^n)$, the infimum is attained when $c_{\alpha} = T(x^n)$, yielding
$$\text{p-value} = \sup_{\theta \in \Theta_0} P_{\theta}(T(X^n) \ge T(x^n)).$$Let $X_1, \dots, X_n \sim \text{Uniform}(0, \theta)$ and let $Y = \max \{X_1, \dots, X_n\}$. We want to test
$$H_0 : \theta = 1/2 \text{ versus } H_1 : \theta > 1/2.$$The Wald test is not appropriate since $Y$ does not converge to a Normal. Suppose we decide to test this hypothesis by rejecting $H_0$ when $Y > c$.
(a) Find the power function.
Solution:
The power function is \begin{align*} \beta(\theta) &= P_{\theta}(Y > c) \\ &= P_{\theta}(\max \{X_1, \dots, X_n \} > c) \\ &= 1 - \prod_{i=1}^n P_{\theta}(X_i \le c) \\ &= \begin{cases} 0 & \theta \le c \\ 1 - \left(\frac{c}{\theta}\right)^n & \theta > c. \end{cases} \end{align*}
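As a quick sketch (the particular values of $c$ and $n$ below are illustrative only), the power function can be evaluated directly:
def uniform_max_power(theta, c, n):
    # Power of the test "reject H_0 when Y > c" when X_1, ..., X_n ~ Uniform(0, theta).
    return 0.0 if theta <= c else 1 - (c / theta) ** n
print([round(uniform_max_power(t, c=0.5, n=20), 3) for t in (0.4, 0.5, 0.6, 0.7)])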
(b) What choice of $c$ will make the size of the test .05?
Solution: Let $\theta_0 = .5$. Letting $c^*$ be the desired value, we have
\begin{align*} .05 &= \sup_{\theta \in \Theta_0} \beta(\theta) \\ &= \beta(\theta_0) \tag{$\Theta_0 = \{\theta_0\}$} \end{align*}meaning $c^* < \theta_0$, and
\begin{align*} .05 &= 1 - \left(\frac{c^*}{\theta_0}\right)^n \\ \Rightarrow c^* &= \theta_0 \cdot .95 ^{1/n} = 0.5 \cdot .95 ^{1/n} \end{align*}(c) In a sample of size $n=20$ with $Y=0.48$ what is the p-value? What conclusion about $H_0$ would you make?
Solution:
The p-value is the smallest test size such that the null hypothesis is rejected. In this case, the p-value is $\inf \{ \alpha : Y > c_{\alpha} \}$, where $c_{\alpha} = 0.5 \cdot (1-\alpha)^{1/n}$. Observe that as $\alpha$ decreases, $c_{\alpha}$ increases. Thus, the p-value is $\alpha^*$, where $c_{\alpha^*} = Y$, i.e.
$$0.48 = 0.5 \cdot (1-\alpha^*)^{1/20} \Rightarrow \alpha^* = 1-(0.48 / 0.5)^{20} \approx 0.558,$$meaning this test provides little or no evidence against the null hypothesis.
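A quick numerical check of parts (b) and (c), using the formulas derived above (the variable names are just for illustration):
n = 20
c_star = 0.5 * 0.95 ** (1 / n)  # size-0.05 cutoff from part (b)
p_value = 1 - (0.48 / 0.5) ** n  # p-value for Y = 0.48 from part (c)
print(f"c*: {c_star:.4f}, p-value for Y = 0.48: {p_value:.3f}")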
(d) In a sample of size $n = 20$ with $Y = 0.52$ what is the p-value? What conclusion about $H_0$ would you make?
Solution: Note that for all $\alpha$, $c_{\alpha} \le 0.5$. Therefore, we have $Y > c_{\alpha}$ for all $\alpha$. Since $\alpha \in [0,1]$, the smallest test size at which the null is rejected is the size 0 test, $Y > c_{0} = 0.5$. Thus, the p-value is 0: the observed $Y = 0.52$ is impossible under $H_0$ (which implies $Y \le 1/2$ with probability one), so we reject $H_0$.
There is a theory that people can postpone their death until after an important event. To test the theory, Phillips and King (1988) collected data on deaths around the Jewish holiday Passover. Of 1919 deaths, 922 died the week before the holiday and 997 died the week after. Think of this as a binomial and test the null hypothesis that $\theta = 1/2$. Report and interpret the p-value. Also construct a confidence interval for $\theta$.
Solution:
Let $a=997$ be the number of deaths after Passover, and $n=1919$ be the total number of deaths. The maximum likelihood estimator for $\theta$ is $\hat{\theta} = a / n$, with standard error $\hat{se} = \sqrt{\frac{\hat{\theta}(1-\hat{\theta})}{n}} \approx 0.011$, and the Wald test statistic is $W = \frac{\hat{\theta} - \theta_0}{\hat{se}}$. The p-value is $2\Phi(-|w|)$, where $w$ is the observed value of $W$.
theta_0 = 0.5 # parameter in null hypothesis
n = 1919
after = 997
theta_hat = after / n
se_hat = math.sqrt(theta_hat * (1 - theta_hat) / n)
w = (theta_hat - theta_0) / se_hat
p = 2 * norm.cdf(-np.abs(w))
print(f"p-value: {p:.3f}")
alpha = 0.05
z = norm.ppf(1 - alpha / 2)
print(
f"{100 * (1 - alpha):.0f}% Confidence Interval: ({theta_hat - z * se_hat:.3f}, {theta_hat + z * se_hat:.3f})"
)
p-value: 0.087 95% Confidence Interval: (0.497, 0.542)
Since the p-value falls between 0.05 and 0.10, we have weak evidence against $H_0$.
In 1861, 10 essays appeared in the New Orleans Daily Crescent. They were signed "Quintus Curtius Snodgrass" and some people suspected they were actually written by Mark Twain. To investigate this, we will consider the proportion of three-letter words found in an author's work. From eight Twain essays we have:
$$.225 \quad .262 \quad .217 \quad .240 \quad .230 \quad .229 \quad .235 \quad .217$$From 10 Snodgrass essays we have:
$$.209 \quad .205 \quad .196 \quad .210 \quad .202 \quad .207 \quad .224 \quad .223 \quad .220 \quad .201$$(a) Perform a Wald test for equality of the means. Use the nonparametric plug-in estimator. Report the p-value and a 95 percent confidence interval for the difference of means. What do you conclude?
Solution: (Following Example 10.8.) Let $\mu_1$ and $\mu_2$ be the mean proportions of three-letter words in Twain essays and Snodgrass essays, respectively. We test the null hypothesis that $\mu_1 = \mu_2$ by testing $H_0: \delta = 0$ versus $H_1 : \delta \ne 0$, where $\delta = \mu_1 - \mu_2$. The nonparametric plug-in estimate of $\delta$ is $\hat{\delta} = \bar{X} - \bar{Y}$ with estimated standard error
$$\hat{se} = \sqrt{\frac{s_1^2}{m} + \frac{s_2^2}{n}}$$where $s_1^2$ and $s_2^2$ are sample variances.
twain = np.array([0.225, 0.262, 0.217, 0.240, 0.230, 0.229, 0.235, 0.217])
snodgrass = np.array(
[0.209, 0.205, 0.196, 0.210, 0.202, 0.207, 0.224, 0.223, 0.220, 0.201]
)
m = twain.size
n = snodgrass.size
delta_hat = np.mean(twain) - np.mean(snodgrass)
print(f"delta_hat: {delta_hat:.3f}")
s_1 = np.std(twain, ddof=1)
s_2 = np.std(snodgrass, ddof=1)
se_hat = math.sqrt((s_1**2) / m + (s_2**2) / n)
w = delta_hat / se_hat
p = 2 * norm.cdf(-np.abs(w))
print(f"p-value: {p:.4f}")
alpha = 0.05
z = norm.ppf(1 - alpha / 2)
print(
f"{100 * (1 - alpha):.0f}% Confidence Interval: ({delta_hat - z * se_hat:.3f}, {delta_hat + z * se_hat:.3f})"
)
delta_hat: 0.022 p-value: 0.0002 95% Confidence Interval: (0.010, 0.034)
The very small p-value indicates the data strongly supports the conclusion that the means are different. Snodgrass may be Twain, but according to this metric, the writing styles are different.
(b) Now use a permutation test to avoid the use of large sample methods. What is your conclusion?
def T(data):
return np.mean(data[:m]) - np.mean(data[m:])
data = np.concatenate([twain, snodgrass])
t_obs = T(data)
B = 100000 # number of permutations to sample
count = 0
for i in range(B):
permutation = rng.permutation(data)
t_test = T(permutation)
if t_test > t_obs:
count += 1
p = count / B
print(f"p-value: {p:.6f}")
p-value: 0.000440
The conclusion is the same as that for part (a).
Let $X_1, \dots, X_n \sim N(\theta, 1)$. Consider testing
$$H_0 : \theta = 0 \text{ versus } \theta = 1.$$Let the rejection region be $R = \{x^n : T(x^n) > c \}$ where $T(x^n) = n^{-1} \sum_{i=1}^n X_i$.
(a) Find $c$ so that the test has size $\alpha$.
Solution: Let $\theta_0 = 0$. Observe that, under the null hypothesis, $T(X^n) \sim N(0, \frac{1}{n})$. \begin{align*} \alpha &= P_{\theta_0}(T(X^n) > c^*) \\ &= P_{\theta_0} \left( \frac{T(X^n)}{\sqrt{1 / n}} > c^* / \sqrt{1/n} \right) \\ &= P(Z > \sqrt{n} c^*) \\ \Rightarrow c^* &= \frac{1}{\sqrt{n}} \Phi^{-1}(1-\alpha) = n^{-1/2}z_{\alpha} \end{align*}
(b) Find the power under $H_1$, that is, find $\beta(1)$.
Under the alternative hypothesis, $T(X^n) \sim N(1, \frac{1}{n})$.
\begin{align*} \beta(1) &= P_{\theta=1}\left(T(X^n) \ge c_{\alpha}\right) \\ &= P_{\theta=1}\left(\frac{T(X^n) - 1}{\frac{1}{\sqrt{n}}} \ge \frac{c_{\alpha} - 1}{\frac{1}{\sqrt{n}}}\right) \\ &= P(Z \ge \sqrt{n}(c_{\alpha} - 1)) \\ &= 1 - \Phi(z_{\alpha} - \sqrt{n}) \end{align*}(c) Show that $\beta(1) \rightarrow 1$ as $n \rightarrow \infty$.
Solution: As $n \rightarrow \infty$, $z_{\alpha} - \sqrt{n} \rightarrow -\infty$, $\Phi(z_{\alpha} - \sqrt{n}) \rightarrow 0$, and $\beta(1) = 1 - \Phi(z_{\alpha} - \sqrt{n}) \rightarrow 1$.
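A brief simulation sketch to check parts (a) and (b) numerically; the choices $n = 20$, $\alpha = 0.05$, and the number of replications are illustrative assumptions.
n, alpha, reps = 20, 0.05, 100000
c = norm.ppf(1 - alpha) / math.sqrt(n)  # cutoff from part (a)
T0 = rng.normal(loc=0, scale=1, size=(reps, n)).mean(axis=1)  # sample means under H_0
T1 = rng.normal(loc=1, scale=1, size=(reps, n)).mean(axis=1)  # sample means under H_1
print(f"empirical size: {np.mean(T0 > c):.4f} (nominal {alpha})")
print(f"empirical power: {np.mean(T1 > c):.4f} (formula {1 - norm.cdf(norm.ppf(1 - alpha) - math.sqrt(n)):.4f})")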
Let $\hat{\theta}$ be the MLE of a parameter $\theta$ and let $\hat{se} = \{nI(\hat{\theta})\}^{-1/2}$ where $I(\theta)$ is the Fisher information. Consider testing
$$H_0 : \theta = \theta_0 \text{ versus } \theta \ne \theta_0.$$Consider the Wald test with rejection region $R = \{x^n : |Z| > z_{\alpha / 2} \}$ where $Z = (\hat{\theta} - \theta_0)/\hat{se}$. Let $\theta_1 > \theta_0$ be some alternative. Show that $\beta(\theta_1) \rightarrow 1$.
Solution:
\begin{align*} \beta(\theta_1) &= P_{\theta_1} \left( |Z| > z_{\alpha / 2} \right) \\ &= P_{\theta_1} \left( Z > z_{\alpha / 2} \right) + P_{\theta_1} \left( Z < -z_{\alpha / 2} \right) \\ &= P_{\theta_1} \left( \frac{\hat{\theta} - \theta_1}{\hat{se}} + \frac{\theta_1 - \theta_0}{\hat{se}} > z_{\alpha / 2} \right) + P_{\theta_1} \left( \frac{\hat{\theta} - \theta_1}{\hat{se}} + \frac{\theta_1 - \theta_0}{\hat{se}} < -z_{\alpha / 2} \right) \\ &= P \left( Z' > z_{\alpha / 2} - \frac{\theta_1 - \theta_0}{\hat{se}}\right) + P \left(Z' < -z_{\alpha /2 } - \frac{\theta_1 - \theta_0}{\hat{se}} \right) \tag{$Z' \sim N(0,1)$} \\ &= 1 - \Phi \left(z_{\alpha / 2} - \frac{\theta_1 - \theta_0}{\hat{se}}\right) + \Phi \left(-z_{\alpha /2 } - \frac{\theta_1 - \theta_0}{\hat{se}} \right) \end{align*}Observe that $\hat{se} \rightarrow 0$ as $n \rightarrow \infty$, so $(\theta_1 - \theta_0)/\hat{se} \rightarrow \infty$ and both $\Phi$ terms tend to 0; hence $\beta(\theta_1) \rightarrow 1$.
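For intuition, here is a quick numerical sketch of the last display under an illustrative assumption: a Bernoulli-type parameter with $\hat{se} = \sqrt{\theta_1(1-\theta_1)/n}$, $\theta_0 = 0.5$, and $\theta_1 = 0.6$; the power climbs to 1 as $n$ grows.
theta_0, theta_1, alpha = 0.5, 0.6, 0.05
z = norm.ppf(1 - alpha / 2)
for n in [10, 100, 1000, 10000]:
    se = math.sqrt(theta_1 * (1 - theta_1) / n)  # illustrative standard error, shrinking with n
    power = 1 - norm.cdf(z - (theta_1 - theta_0) / se) + norm.cdf(-z - (theta_1 - theta_0) / se)
    print(f"n = {n:5d}: power = {power:.4f}")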
Here are the number of elderly Jewish and Chinese women who died just before and after the Chinese Harvest Moon Festival.
Week | Chinese | Jewish |
---|---|---|
-2 | 55 | 141 |
-1 | 33 | 145 |
1 | 70 | 139 |
2 | 49 | 161 |
Compare the two mortality patterns. (Phillips and Smith (1990)).
Solution:
We first organize the data into a `pd.DataFrame` object.
df = pd.DataFrame(
{
"Week": [-2, -1, 1, 2],
"Chinese": [55, 33, 70, 49],
"Jewish": [141, 145, 139, 161],
}
)
df.set_index("Week", inplace=True)
before = [-2, -1]
after = [1, 2]
chinese_before, jewish_before = df.loc[before].sum().values
chinese_after, jewish_after = df.loc[after].sum().values
We shall first test the hypothesis $H_0: \delta = 0$ against $H_1: \delta \neq 0$, where $\delta = p_1 - p_2$, and $p_1$ and $p_2$ are the probabilities that an elderly Chinese or Jewish woman (respectively), among those dying within two weeks of the festival, dies after the festival.
The MLE is $\hat{\delta} = \hat{p}_1 - \hat{p}_2$, with estimated standard error
$$\hat{se} = \sqrt{ \frac{\hat{p}_1 (1 - \hat{p}_1)}{n_1} + \frac{\hat{p}_2 (1 - \hat{p}_2)}{n_2}}$$where $n_1$ and $n_2$ are the number of Chinese and Jewish women in the sample, respectively.
p_1_hat = chinese_after / (chinese_before + chinese_after)
p_2_hat = jewish_after / (jewish_before + jewish_after)
delta_hat = p_1_hat - p_2_hat
n_1 = df["Chinese"].sum()
n_2 = df["Jewish"].sum()
se_hat = math.sqrt((p_1_hat * (1 - p_1_hat) / n_1) + (p_2_hat * (1 - p_2_hat) / n_2))
w = delta_hat / se_hat
p = 2 * norm.cdf(-np.abs(w))
print(f"p-value: {p:.4f}")
alpha = 0.05
z = norm.ppf(1 - alpha / 2)
print(
f"{100 * (1 - alpha):.0f}% Confidence Interval: ({delta_hat - z * se_hat:.3f}, {delta_hat + z * se_hat:.3f})"
)
p-value: 0.1164 95% Confidence Interval: (-0.016, 0.142)
With this test, there is little or no evidence against $H_0$.
For both the Chinese and Jewish populations, we shall conduct a $\chi^2$ test to compare $H_0: p = p_0 = \left(\frac12, \frac12\right)^T$ against $H_1: p \ne p_0$, where the first and second elements of $p$ refer to the proportion of a population dying prior to and after the festival, respectively.
For the Chinese population:
mu_chinese_hat = (1 / 2) * n_1
t_pearson_chinese = (chinese_before - mu_chinese_hat) ** 2 / (mu_chinese_hat) + (
chinese_after - mu_chinese_hat
) ** 2 / (mu_chinese_hat)
critical_value = chi2.ppf(q=0.95, df=1)
p_value = 1 - chi2.cdf(t_pearson_chinese, 1)
print(f"Test Statistic: {t_pearson_chinese:.3f}")
print(
f"95th percentile for chi squared with one degree of freedom: {critical_value:.3f}"
)
print(f"p-value: {p_value:.3f}")
Test Statistic: 4.643 95th percentile for chi squared with one degree of freedom: 3.841 p-value: 0.031
For the Jewish population:
mu_jewish_hat = (1 / 2) * n_2
t_pearson_jewish = (jewish_before - mu_jewish_hat) ** 2 / (mu_jewish_hat) + (
jewish_after - mu_jewish_hat
) ** 2 / (mu_jewish_hat)
critical_value = chi2.ppf(q=0.95, df=1)
p_value = 1 - chi2.cdf(t_pearson_jewish, 1)
print(f"Test Statistic: {t_pearson_jewish:.3f}")
print(
f"95th percentile for chi squared with one degree of freedom: {critical_value:.3f}"
)
print(f"p-value: {p_value:.3f}")
Test Statistic: 0.334 95th percentile for chi squared with one degree of freedom: 3.841 p-value: 0.563
With this test, we have evidence that the probability of dying after the festival differs from the probability of dying before for Chinese women, but not for Jewish women.
We now perform a likelihood ratio test to compare mortality before and after the event for both groups:
 | Chinese | Jewish |
---|---|---|
Before | 88 | 286 |
After | 119 | 300 |
We test $H_0: \theta \in \Theta_0$ against $H_1: \theta \notin \Theta_0$, where $\theta$ is the vector of cell probabilities (Chinese before, Chinese after, Jewish before, Jewish after) and $\Theta_0$ requires the before and after probabilities to be equal within each group. The unrestricted MLE is
$$\hat{\theta} = \left( \frac{88}{793}, \frac{119}{793}, \frac{286}{793}, \frac{300}{793} \right)$$and the MLE under the null hypothesis is
$$\hat{\theta}_0 = \left( \frac{103.5}{793}, \frac{103.5}{793}, \frac{293}{793}, \frac{293}{793} \right).$$Since $\dim(\Theta) = 3$ and $\dim(\Theta_0) = 1$, Theorem 10.22 gives $\lambda \leadsto \chi^2_2$ under $H_0$.
theta_hat = np.array([88, 119, 286, 300]) / 793
theta_hat_0 = np.array([103.5, 103.5, 293, 293]) / 793
_lambda = 2 * np.sum(
[theta_hat[i] * 793 * math.log(theta_hat[i] / theta_hat_0[i]) for i in range(4)]
)
critical_value = chi2.ppf(q=0.95, df=2)  # df = dim(Theta) - dim(Theta_0) = 3 - 1 = 2
p_value = 1 - chi2.cdf(_lambda, df=2)
print(f"Likelihood Ratio Statistic: {_lambda:.3f}")
print(
f"95th percentile for chi squared with three degrees of freedom: {critical_value:.3f}"
)
print(f"p-value: {p_value:.3f}")
Likelihood Ratio Statistic: 4.995 95th percentile for chi squared with two degrees of freedom: 5.991 p-value: 0.082
With $p \approx 0.08$, this test provides at most weak evidence that the before and after mortality rates differ within either group.
We finally conduct simple binomial tests for each week:
from scipy.stats import binomtest
theta_0 = n_1 / (n_1 + n_2)
p_1 = binomtest(55, 55 + 141, theta_0, alternative="two-sided").pvalue
p_2 = binomtest(33, 33 + 145, theta_0, alternative="two-sided").pvalue
p_3 = binomtest(70, 70 + 139, theta_0, alternative="two-sided").pvalue
p_4 = binomtest(49, 49 + 161, theta_0, alternative="two-sided").pvalue
results = pd.DataFrame({"p-value": [p_1, p_2, p_3, p_4]}, index=[-2, -1, 1, 2])
results
Week | p-value |
---|---|
-2 | 0.516380 |
-1 | 0.021061 |
1 | 0.017937 |
2 | 0.388072 |
This test suggests strong evidence that, in the weeks immediately before and after the festival, the Chinese share of deaths differs from its overall proportion (lower in the week before, higher in the week after), but there is no such evidence for the other two weeks.
A randomized, double-blind experiment was conducted to assess the effectiveness of several drugs for reducing postoperative nausea. The data are as follows.
 | Number of Patients | Incidence of Nausea |
---|---|---|
Placebo | 80 | 45 |
Chlorpromazine | 75 | 26 |
Dimenhydrinate | 85 | 52 |
Pentobarbital (100 mg) | 67 | 35 |
Pentobarbital (150 mg) | 85 | 37 |
(a) Test each drug versus the placebo at the 5 per cent level. Also, report the estimated odds-ratios. Summarize your findings.
(b) Use the Bonferroni and the FDR method to adjust for multiple testing.
Solution:
df = pd.DataFrame(
data={
"Number of Patients": [80, 75, 85, 67, 85],
"Incidence of Nausea": [45, 26, 52, 35, 37],
},
index=[
"Placebo",
"Chlorpromazine",
"Dimenhydrinate",
"Pentobarbital (100 mg)",
"Pentobarbital (150 mg)",
],
)
alpha = 0.05
df['p_hat'] = df['Incidence of Nausea'] / df['Number of Patients']
p_0 = df.loc['Placebo']['p_hat']
n_0 = df.loc['Placebo']['Number of Patients']
df['se_hat'] = (df['p_hat'] * (1 - df['p_hat']) / df['Number of Patients'] + p_0 * (1 - p_0) / n_0) ** (1 / 2)
df['delta_hat'] = df['p_hat'] - p_0
df['w'] = df['delta_hat'] / df['se_hat']
df['p_value'] = 2 * norm.cdf(-abs(df['w']))
z = norm.ppf(1 - alpha / 2)
df['Reject Null'] = df['p_value'] <= alpha
df['Estimated Odds'] = df['Incidence of Nausea'] / (df['Number of Patients'] - df['Incidence of Nausea'])
df['Estimated Odds Ratio'] = df.loc['Placebo', 'Estimated Odds'] / df['Estimated Odds']  # placebo odds / treatment odds
df[['p_hat', 'p_value', 'Reject Null', 'Estimated Odds Ratio']]
 | p_hat | p_value | Reject Null | Estimated Odds Ratio |
---|---|---|---|---|
Placebo | 0.562500 | 1.000000 | False | 1.000000 |
Chlorpromazine | 0.346667 | 0.005703 | True | 2.423077 |
Dimenhydrinate | 0.611765 | 0.520232 | False | 0.815934 |
Pentobarbital (100 mg) | 0.522388 | 0.626664 | False | 1.175510 |
Pentobarbital (150 mg) | 0.435294 | 0.099639 | False | 1.667954 |
Chlorpromazine is the only treatment for which the data provide strong evidence of a difference in performance from the placebo ($p = 0.0057$). The estimated odds ratio of about 2.42 means the odds of nausea under Chlorpromazine are roughly 59% lower than under the placebo.
(b) To apply the Bonferroni Method, we reject the null hypothesis $H_{0i}$ if
$$P_i < \frac{\alpha}{m},$$where $P_i$ is the $p$-value of the $i$th test and $m$ is the number of tests. This ensures the probability of falsely rejecting any null hypothesis is at most $\alpha$.
m = 4 # four different hypothesis tests
df['Reject Null (Bonferroni)'] = df['p_value'] < alpha / m
df['Reject Null (Bonferroni)']
Placebo False Chlorpromazine True Dimenhydrinate False Pentobarbital (100 mg) False Pentobarbital (150 mg) False Name: Reject Null (Bonferroni), dtype: bool
To apply the Benjamini-Hochberg (FDR) method, we order the p-values, find the largest $i$ such that $P_{(i)} < \ell_i = i \alpha / (C_m m)$, and reject every hypothesis whose p-value is at most the threshold $T = P_{(i)}$. Because the p-values are dependent (each test reuses the placebo data), we use $C_m = \sum_{i=1}^m 1/i$.
ordered_p_values = np.sort(df['p_value'].values)
C_m = sum([(1 / i) for i in range(1, m + 1)]) # p-values are not independent, since they all
# depend on the placebo data
l = [(i * alpha) / (C_m * m) for i in range(1, m + 1)]
R = max([i for i in range(m) if ordered_p_values[i] < l[i]])
T = ordered_p_values[R]
df['Reject Null (Benjamini-Hochberg)'] = df['p_value'] <= T
df['Reject Null (Benjamini-Hochberg)']
Placebo False Chlorpromazine True Dimenhydrinate False Pentobarbital (100 mg) False Pentobarbital (150 mg) False Name: Reject Null (Benjamini-Hochberg), dtype: bool
Both approaches for controlling for multiple testing give the same result as directly evaluating the p-values.
Let $X_1, \dots, X_n \sim \text{Poisson}(\lambda)$.
(a) Let $\lambda_0 > 0$. Find the size $\alpha$ Wald test for
$$H_0 : \lambda = \lambda_0 \text{ versus } H_1 : \lambda \ne \lambda_0$$Solution: If $X \sim \text{Poisson}(\lambda)$, then $E(X) = Var(X) = \lambda$. Hence, our estimated standard error is $$\hat{\text{se}} = \sqrt{\bar{X} / n}$$ and, under $H_0$, $$\frac{\bar{X} - \lambda_0}{\hat{\text{se}}} \leadsto N(0,1).$$
Thus, the size $\alpha$ Wald test is: reject $H_0$ when $|W| > z_{\alpha / 2}$, where
$$W = \frac{\bar{X} - \lambda_0}{ \sqrt{\bar{X} / n}}.$$(b) (Computer experiment.) Let $\lambda_0 = 1, n = 20$ and $\alpha = 0.05$. Simulate $X_1, \dots, X_n \sim \text{Poisson}(\lambda_0)$ and perform the Wald test. Repeat many times and count how often you reject the null. How close is the Type I error rate to 0.05?
lambda_0 = 1
n = 20
k = 1000000
alpha = 0.05
z = norm.ppf(1 - alpha / 2)
np.random.seed(42)
X = np.random.poisson(lam=lambda_0, size=(n, k))
X_bar = np.mean(X, axis=0)
se = np.sqrt(X_bar / n)
W = (X_bar - lambda_0) / se
type_one_error_rate = np.sum(np.abs(W) > z) / k
print(f"The type 1 error rate is {type_one_error_rate:.4f} ({k} trials).")
The type 1 error rate is 0.0524 (1000000 trials).
The simulated Type I error rate (0.0524) is close to the nominal rate of 0.05, within about 5% in relative terms.
Let $X_1, \dots, X_n \sim N(\mu, \sigma ^ 2)$. Construct the likelihood ratio test for
$$H_0 : \mu = \mu_0 \text{ versus } \mu \ne \mu_0.$$Compare to the Wald test.
Solution:
Recall the likelihood function: \begin{align*} \mathcal{L}(\mu ; X_1,\dots, X_n) = \mathcal{L}(\mu) &= \prod_{i=1}^n \frac{1}{\sqrt{2 \pi \sigma^2}} \exp{\left[-(X_i - \mu)^2 / (2\sigma^2)\right]} \\ &= \left(2 \pi \sigma ^ 2 \right) ^ {-(n / 2)} \exp \left[ \sum_{i = 1} ^ n -(X_i - \mu)^2 / (2\sigma^2) \right], \end{align*} which is maximized by $\mu = \bar{X}$. The maximizer in $\Theta_0 = \{ \mu_0 \}$ is trivially $\mu_0$. Thus, the likelihood statistic is:
\begin{align*} \lambda = 2 \log \left(\frac{\mathcal{L}(\bar{X})}{\mathcal{L}(\mu_0)}\right) &= \frac{1}{\sigma^2} \left[ \sum_{i = 1} ^ n (X_i - \mu_0)^2-(X_i - \bar{X})^2 \right] \\ &= \frac{1}{\sigma^2} \left[ \sum_{i = 1} ^ n X_i^2 -2\mu_0X_i + \mu_0^2 - X_i^2 + 2X_i\bar{X} - \bar{X}^2 \right] \\ &= \frac{1}{\sigma^2} \left[ \sum_{i = 1} ^ n \mu_0^2 - \bar{X}^2 -2X_i(\mu_0 - \bar{X}) \right] \\ &= \frac{1}{\sigma^2} \left[ n\mu_0^2 -n\bar{X}^2 - 2n\bar{X}\mu_0 + 2n\bar{X}^2 \right] \\ &= \frac{n}{\sigma^2} \left[\mu_0^2 -2\bar{X}\mu_0 + \bar{X}^2 \right] \\ & = \frac{(\mu_0 - \bar{X})^2}{\sigma^2 / n} \end{align*}By Theorem 10.22, under $H_0$, $\lambda \leadsto \chi^2_1$, i.e. the distribution constructed from squaring a single standard normal distribution. Thus, the size $\alpha$ likelihood ratio test: reject $H_0$ when $\lambda > \chi^2_{1, \alpha}$.
Meanwhile, the MLE for the mean is $\bar{X}$, which we know has variance $\sigma^2 / n$. Thus, the Wald test statistic is
$$W = \frac{\mu_0 - \bar{X}}{\sqrt{\sigma^2 / n}}, \qquad W^2 = \lambda,$$which converges under $H_0$ to $N(0,1)$. Rejecting when $|W| > z_{\alpha / 2}$ is the same as rejecting when $\lambda > z_{\alpha / 2}^2 = \chi^2_{1, \alpha}$, so the two tests are equivalent.
mu = math.pi
mu_0 = 3
sigma = math.e
n = 1000
k = 1000
alpha = 0.05
X = np.random.normal(loc=mu, scale=sigma, size=(n, k))
X_bar = np.mean(X, axis=0)
lam = ((mu_0 - X_bar) ** 2) / ((sigma ** 2) / n)
W = (mu_0 - X_bar) / math.sqrt(sigma ** 2 / n)
z_w = norm.ppf(1 - alpha / 2)
z_lr = chi2.ppf(1-alpha, df=1)
# Wald test and Likelihood ratio test give the same results:
assert(np.array_equal((np.abs(W) > z_w), (lam > z_lr)))
Let $X_1, \dots, X_n \sim N(\mu, \sigma^2)$. Construct the likelihood ratio test for $$H_0 : \sigma = \sigma_0 \text{ versus } H_1 : \sigma \ne \sigma_0$$ Compare to the Wald test.
Solution:
We first seek the MLE of the standard deviation of a normal distribution with a known mean. We have the log-likelihood function:
$$\mathcal{l}(\sigma) = -\frac{n \log (2 \pi \sigma^2)}{2} - \frac{1}{2\sigma^2} \sum_{i = 1} ^ n (X_i - \mu)^2$$with derivative:
$$\frac{d}{d\sigma} \mathcal{l}(\sigma) = -\frac{n}{\sigma} + \frac{1}{\sigma^3} \sum_{i = 1} ^ n (X_i - \mu)^2$$Equating the derivative with 0, we get the MLE:
$$\hat{\sigma} = \sqrt{\frac{1}{n} \sum_{i = 1} ^ n (X_i - \mu)^2}$$Computing the likelihood ratio statistic:
\begin{align*} \lambda &= 2 \cdot \log \left( \frac{\mathcal{L}(\hat{\sigma})}{\mathcal{L}(\sigma_0)} \right) \\ &= 2 \cdot \left[ \mathcal{l}(\hat{\sigma}) - \mathcal{l}(\sigma_0) \right] \\ &= n \left[\left(\frac{\hat{\sigma}}{\sigma_0}\right)^2 - 2 \cdot \log \left( \frac{\hat{\sigma}}{\sigma_0} \right) - 1 \right] \tag{$n\hat{\sigma}^2 = \sum_{i=1}^n (X_i - \mu)^2$} \\ \end{align*}The size $\alpha$ likelihood ratio test rejects the null hypothesis if $\lambda$ exceeds $\chi^2_{1, \alpha}$.
For the Wald test, we must compute the estimated standard error of the MLE, $\hat{\sigma}$:
$$ \hat{\text{se}} = \sqrt{1 / I_n(\hat{\sigma})}$$where $I_n(\sigma) = n I(\sigma)$ is the Fisher information, and
$$I(\sigma) = - \mathbb{E}_{\sigma} \left( \frac{d^2 \log f(X, \sigma)}{d \sigma^2} \right) $$where
$$ f(X, \sigma) = \frac{1}{\sqrt{2 \pi \sigma ^2}} \exp \left[ -(X - \mu) ^2 / (2 \sigma ^2) \right].$$So,
\begin{align*} \log f(X, \sigma) &= -\frac{\log(2 \pi \sigma^2)}{2} - \frac{(X-\mu)^2}{2\sigma^2}, \\ \frac{d \log f(X, \sigma)}{d\sigma} &= s(X, \sigma) = \frac{(X-\mu)^2}{\sigma ^3} - \frac{1}{\sigma}, \\ \frac{d^2 \log f(X, \sigma)}{d\sigma^2} &= s'(X, \sigma) = \frac{1}{\sigma^2} - \frac{3(X-\mu)^2}{\sigma^4}, \\ I(\sigma) &= \frac{3}{\sigma^4}\mathbb{E}((X - \mu)^2) - \frac{1}{\sigma^2} = \frac{2}{\sigma^2}, \\ I_n(\sigma) &= \frac{2n}{\sigma^2}, \\ \hat{\text{se}} &= \sqrt{\frac{\hat{\sigma}^2}{2n}} \end{align*}and the Wald statistic is therefore:
$$W = \frac{\hat{\sigma} - \sigma_0}{\hat{\sigma} / \sqrt{2n}}$$Checking the above results via simulation:
mu = 3
sigma_0 = 6
n = 1000
k = 10000
X = np.random.normal(loc=mu, scale=sigma_0, size=(n,k))
sigma_hat = np.sqrt(np.sum(np.power(X - mu, 2), axis=0) / n)
lam = n * (-2 * np.log(sigma_hat / sigma_0) + np.power(sigma_hat / sigma_0, 2) - 1)
Z = np.arange(0, 10, 0.1)
chi2_pdf = chi2.pdf(Z, df=1)
_ = plt.hist(lam, bins=50, histtype='step', density=True)
_ = plt.plot(Z, chi2_pdf)
_ = plt.ylim(0,1)
se_hat = sigma_hat / np.sqrt(2 * n)
W = (sigma_hat - sigma_0) / se_hat
Z = np.arange(-4, 4, 0.01)
norm_pdf = norm.pdf(Z, loc=0, scale=1)
_ = plt.hist(W, bins=100, histtype='step', density=True)
_ = plt.plot(Z, norm_pdf)
Let $X \sim \text{Binomial}(n, p)$. Construct the likelihood ratio test for
$$H_0 : p = p_0 \text{ versus } H_1 : p \ne p_0.$$Compare to the Wald test.
Solution:
Since $$\mathcal{L}(X, n, p) = \binom{n}{X}p^X (1-p)^{n-X}$$ the log likelihood is: $$\log \mathcal{L}(X, n, p) = \log \binom{n}{X} + X \log(p) + (n - X) \log(1-p),$$ which is maximized by $\hat{p} = X / n$. The likelihood ratio statistic is given by:
\begin{align*} \lambda &= 2 \cdot \log\left( \frac{\mathcal{L}(X, \hat{p})}{\mathcal{L}(X, p_0)} \right) \\ &= 2 \cdot \left( X \log \left(\frac{\hat{p}}{p_0} \right) + (n - X) \log \left(\frac{1-\hat{p}}{1-p_0} \right) \right). \\ \end{align*}The estimated standard error of the MLE is $\sqrt{\hat{p}(1-\hat{p}) / n }$. This can be derived by recognizing that a draw from $\text{Binomial}(n,p)$ is equivalent to $n$ draws from $\text{Bernoulli}(p)$, and applying the Fisher information method. The Wald statistic is then:
$$W = \sqrt{n} \frac{(\hat{p} - p_0)}{\sqrt{\hat{p}(1-\hat{p})}}$$Let $\theta$ be a scalar parameter and suppose we test
$$H_0 : \theta = \theta_0 \text{ versus } H_1 : \theta \ne \theta_0.$$Let $W$ be the Wald test statistic and let $\lambda$ be the likelihood ratio test statistic. Show that these tests are equivalent in the sense that
$$\frac{W^2}{\lambda} \xrightarrow{P} 1$$as $n \to \infty$. Hint: Use a Taylor expansion of the log-likelihood $\mathcal{l}(\theta)$ to show that
$$\lambda \approx \left(\sqrt{n}(\hat{\theta} - \theta_0) \right) ^ 2 \left(-\frac{1}{n} \mathcal{l}''(\hat{\theta}) \right).$$Solution:
Assuming the log-likelihood is twice differentiable at $\hat{\theta}$, it admits the Taylor expansion:
\begin{align*} \mathcal{l}(\theta_0) &= \mathcal{l}(\hat{\theta}) + \mathcal{l}'(\hat{\theta})(\theta_0 - \hat{\theta}) + \mathcal{l}''(\hat{\theta})\frac{(\theta_0 - \hat{\theta})^2}{2} + o((\theta_0 - \hat{\theta})^2) \\ &\approx \mathcal{l}(\hat{\theta}) + \mathcal{l}'(\hat{\theta})(\theta_0 - \hat{\theta}) + \mathcal{l}''(\hat{\theta})\frac{(\theta_0 - \hat{\theta})^2}{2} \tag{for $\theta_0$ near $\hat{\theta}$}\\ &= \mathcal{l}(\hat{\theta}) + \mathcal{l}''(\hat{\theta})\frac{(\theta_0 - \hat{\theta})^2}{2} \tag{$\hat{\theta}$ is an extremum}\\ \end{align*}Thus, the likelihood ratio statistic can be expressed:
\begin{align*} \lambda &= 2 \cdot \log \left( \frac{\mathcal{L}(\hat{\theta})}{\mathcal{L}(\theta_0)}\right) \\ &= 2 \cdot (\mathcal{l}(\hat{\theta}) - \mathcal{l}(\theta_0)) \\ &\approx 2 \cdot \left( -\mathcal{l}''(\hat{\theta})\frac{(\theta_0 - \hat{\theta})^2}{2} \right) \\ &= \left(\sqrt{n}(\hat{\theta} - \theta_0) \right) ^ 2 \left(-\frac{1}{n} \mathcal{l}''(\hat{\theta}) \right). \end{align*}Meanwhile, the Wald Statistic is:
\begin{align*} W &= \frac{\hat{\theta} - \theta_0}{\hat{\text{se}}} \\ &= \sqrt{I(\hat{\theta})n}(\hat{\theta} - \theta_0) \end{align*}Thus,
\begin{align*} \frac{W^2}{\lambda} &= \frac{I(\hat{\theta})n(\hat{\theta} - \theta_0) ^2}{\left(\sqrt{n}(\hat{\theta} - \theta_0) \right) ^ 2 \left(-\frac{1}{n} \mathcal{l}''(\hat{\theta}) \right)} \\ &= -\frac{I(\hat{\theta})}{\mathcal{l}''(\hat{\theta}) / n} \end{align*}Note that
$$\mathcal{l}''(\hat{\theta}) = \sum_{i=1}^n \frac{d^2}{d\theta^2} \log f(X_i, \theta) \bigg\rvert_{\theta = \hat{\theta}}$$and
$$I(\hat{\theta}) = -\mathbb{E}_{\hat{\theta}}\left(\frac{d^2}{d\theta^2} \log f(X, \theta)\right)$$Thus, by the Weak Law of Large Numbers, $-\frac{1}{n}\mathcal{l}''(\hat{\theta}) \xrightarrow{P} I(\hat{\theta})$, so $W^2 / \lambda \xrightarrow{P} 1$ by Theorem 5.5(d).
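As a quick sanity check (not part of the proof), here is a minimal simulation sketch assuming a Bernoulli($p_0$) model, an illustrative choice: under $H_0$, the ratio $W^2 / \lambda$ should approach 1 as $n$ grows.
p_0 = 1 / 3  # null value; Bernoulli model chosen purely for illustration
for n in [50, 500, 5000, 50000]:
    x = rng.binomial(1, p_0, size=n)  # data generated under H_0
    p_hat = x.mean()
    se_hat = math.sqrt(p_hat * (1 - p_hat) / n)
    W = (p_hat - p_0) / se_hat
    lam = 2 * np.sum(x * np.log(p_hat / p_0) + (1 - x) * np.log((1 - p_hat) / (1 - p_0)))
    print(f"n = {n:6d}: W^2 / lambda = {W ** 2 / lam:.4f}")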