import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
from scipy.special import expit
import sympy as sp
from tqdm import tqdm
pd.set_option("display.precision", 3)
Show that (17.1) and (17.2) are equivalent:
$$f_{X,Y \mid Z}(x, y \mid z) = f_{X \mid Z}(x \mid z) f_{Y \mid Z}(y \mid z) \tag{17.1}$$
$$f(x \mid y, z) = f(x \mid z) \tag{17.2}$$
Solution:
By the definition of conditional probability:
$$ \begin{align*} &f_{X,Y \mid Z}(x,y \mid z) = f_{X \mid Z}(x \mid z) f_{Y \mid Z}(y \mid z) \\ &\iff \frac{f_{X,Y,Z}(x,y,z)}{f_Z(z)} = \frac{f_{X,Z}(x,z)}{f_Z(z)} \frac{f_{Y,Z}(y,z)}{f_Z(z)} \\ &\iff f_{X,Y,Z}(x,y,z)= \frac{f_{X,Z}(x,z)}{f_Z(z)} f_{Y,Z}(y,z) \\ &\iff \frac{f_{X,Y,Z}(x,y,z)}{f_{Y,Z}(y,z)} = \frac{f_{X,Z}(x,z)}{f_Z(z)} \\ &\iff f_{X \mid Y, Z}(x \mid y, z) = f_{X \mid Z}(x \mid z) \iff f(x \mid y,z) = f(x \mid z) \end{align*} $$Prove Theorem 17.2:
The following implications hold:
$$ \begin{align*} X \amalg Y \mid Z &\Rightarrow Y \amalg X \mid Z \tag{1}\\ X \amalg Y \mid Z \text{ and } U = h(X) &\Rightarrow U \amalg Y \mid Z \tag{2}\\ X \amalg Y \mid Z \text{ and } U = h(X) &\Rightarrow X \amalg Y \mid (Z, U) \tag{3}\\ X \amalg Y \mid Z \text{ and } X \amalg W \mid (Y, Z) &\Rightarrow X \amalg (W,Y) \mid Z \tag{4}\\ X \amalg Y \mid Z \text{ and } X \amalg Z \mid Y &\Rightarrow X \amalg (Y, Z) \tag{5} \end{align*} $$Solution:
(1)
$$ \begin{align*} f_{Y,X \mid Z}(y, x \mid z) &= f_{X,Y \mid Z}(x, y \mid z) \\ &= f_{X \mid Z}(x \mid z) f_{Y \mid Z}(y \mid z) \tag{$X \amalg Y \mid Z$}\\ &= f_{Y \mid Z}(y \mid z) f_{X \mid Z}(x \mid z). \end{align*} $$(2)
Summing over all $x$ with $h(x) = u$ (with sums replaced by integrals in the continuous case):
$$ \begin{align*} f_{U, Y \mid Z}(u, y \mid z) &= \sum_{x : h(x) = u} f_{X, Y \mid Z}(x, y \mid z) \\ &= \sum_{x : h(x) = u} f_{X \mid Z}(x \mid z) f_{Y \mid Z}(y \mid z) \tag{$X \amalg Y \mid Z$}\\ &= f_{Y \mid Z}(y \mid z) \sum_{x : h(x) = u} f_{X \mid Z}(x \mid z) \\ &= f_{U \mid Z}(u \mid z) f_{Y \mid Z}(y \mid z). \end{align*} $$(3)
Showing satisfaction of (17.2), i.e. that $f(y \mid x, z, u) = f(y \mid z, u)$ whenever $u = h(x)$:
$$ \begin{align*} f_{Y \mid X, Z, U}(y \mid x, z, u) &= f_{Y \mid X, Z}(y \mid x, z) \tag{$U = h(X)$ carries no extra information given $X$}\\ &= f_{Y \mid Z}(y \mid z) \tag{$X \amalg Y \mid Z$, Def (17.2)}\\ &= f_{Y \mid Z, U}(y \mid z, u) \tag{$U \amalg Y \mid Z$ by (1)–(2), Def (17.2)} \end{align*} $$(4)
$$ \begin{align*} f_{X, W, Y \mid Z}(x, w, y \mid z) &= f_{X, W \mid Y, Z}(x, w \mid y, z) f_{Y \mid Z}(y \mid z) \tag{condition on $y$}\\ &= \left[f_{X \mid Y, Z}(x \mid y, z) f_{W \mid Y, Z}(w \mid y, z)\right] f_{Y \mid Z}(y \mid z) \tag{$X \amalg W \mid (Y, Z)$}\\ &= f_{X, Y \mid Z}(x, y \mid z) f_{W \mid Y, Z}(w \mid y, z) \tag{remove conditioning on $y$}\\ &= \left[f_{X \mid Z}(x \mid z) f_{Y \mid Z}(y \mid z)\right] f_{W \mid Y, Z}(w \mid y, z) \tag{$X \amalg Y \mid Z$} \\ &= f_{X \mid Z}(x \mid z) f_{W, Y \mid Z}(w, y \mid z) \end{align*} $$(5)
By Definition (17.2), $X \amalg Y \mid Z$ gives $f_{X \mid Y, Z}(x \mid y, z) = f_{X \mid Z}(x \mid z)$, and $X \amalg Z \mid Y$ gives $f_{X \mid Y, Z}(x \mid y, z) = f_{X \mid Y}(x \mid y)$. Hence
$$f_{X \mid Y}(x \mid y) = f_{X \mid Z}(x \mid z)$$whenever $f_{Y,Z}(y,z) > 0$. The left side does not depend on $z$ and the right side does not depend on $y$, so both equal some function $g(x)$ of $x$ alone. Integrating (or summing) over $y$,
$$f_X(x) = \int f_{X \mid Y}(x \mid y) f_Y(y) \, dy = g(x) \int f_Y(y) \, dy = g(x),$$so $f_{X \mid Y, Z}(x \mid y, z) = g(x) = f_X(x)$. Therefore
$$f_{X, Y, Z}(x, y, z) = f_{X \mid Y, Z}(x \mid y, z) f_{Y, Z}(y, z) = f_X(x) f_{Y, Z}(y, z),$$which is $X \amalg (Y, Z)$ by (17.2).
Let $X, Y$ and $Z$ have the following joint distribution:
$Z = 0$ | $Y = 0$ | $Y = 1$ | $Z = 1$ | $Y = 0$ | $Y = 1$ |
---|---|---|---|---|---|
$X = 0$ | $.405$ | $.045$ | $X = 0$ | $.125$ | $.125$ |
$X = 1$ | $.045$ | $.005$ | $X = 1$ | $.125$ | $.125$ |
(a) Find the conditional distribution of $X$ and $Y$ given $Z = 0$ and the conditional distribution of $X$ and $Y$ given $Z = 1$.
Solution:
For each event $(x, y)$, and for $k \in \{0, 1\}$, the probability given $Z = k$ is simply $P(X = x, Y = y, Z = k) / P(Z = k)$, where the numerator is given in the table and the denominator is:
$$\mathbb{P}(Z = k) = \sum_{(x,y,z) \in \Omega : z = k} \mathbb{P}(x,y,z) = 0.5$$Thus, the conditional distribution of $X$ and $Y$ given $Z = 0$ is:
 | $Y = 0$ | $Y = 1$ |
---|---|---|
$X = 0$ | $.81$ | $.09$ |
$X = 1$ | $.09$ | $.01$ |
and the conditional distribution of $X$ and $Y$ given $Z = 1$ is:
 | $Y = 0$ | $Y = 1$ |
---|---|---|
$X = 0$ | $.25$ | $.25$ |
$X = 1$ | $.25$ | $.25$ |
(b) Show that $X \amalg Y \mid Z$.
Solution:
Observe the fourth column of the following table equals the product of the fifth and sixth columns:
$z$ | $x$ | $y$ | $f_{X, Y \mid Z}(x, y \mid z)$ | $f_{X \mid Z}(x \mid z)$ | $f_{Y \mid Z}(y \mid z)$ |
---|---|---|---|---|---|
0 | 0 | 0 | $.81$ | $.9$ | $.9$ |
0 | 0 | 1 | $.09$ | $.9$ | $.1$ |
0 | 1 | 0 | $.09$ | $.1$ | $.9$ |
0 | 1 | 1 | $.01$ | $.1$ | $.1$ |
1 | 0 | 0 | $.25$ | $.5$ | $.5$ |
1 | 0 | 1 | $.25$ | $.5$ | $.5$ |
1 | 1 | 0 | $.25$ | $.5$ | $.5$ |
1 | 1 | 1 | $.25$ | $.5$ | $.5$ |
Thus, (17.1) holds for each event.
(c) Find the marginal distribution of $X$ and $Y$.
Solution:
For each $(x,y)$, the marginal probability is given by:
$$ \mathbb{P}(X=x, Y=y) = \sum_{k} \mathbb{P}(X=x, Y=y, Z=k) $$Therefore, the marginal distribution of $X$ and $Y$ is:
 | $Y = 0$ | $Y = 1$ |
---|---|---|
$X = 0$ | $.53$ | $.17$ |
$X = 1$ | $.17$ | $.13$ |
(d) Show that $X$ and $Y$ are not marginally independent.
Solution:
It suffices to show there is an event $(x, y)$ such that $f(x)f(y) \ne f(x,y)$. Let $x = 0$ and $y = 0$. Then, $f(x) = 0.7$, $f(y) = 0.7$, but $f(x,y) = 0.53 \ne 0.49 = f(x)f(y)$.
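As a quick numerical check of parts (a)–(d), here is a short NumPy sketch; the array `joint` below simply re-enters the table values, indexed `[x, y, z]`:
# Joint distribution P(X = x, Y = y, Z = z) from the table above, indexed [x, y, z].
joint = np.array(
    [
        [[0.405, 0.125], [0.045, 0.125]],
        [[0.045, 0.125], [0.005, 0.125]],
    ]
)
# (a) Conditional distributions of (X, Y) given Z = 0 and Z = 1.
p_z = joint.sum(axis=(0, 1))
cond_given_z = joint / p_z  # broadcast over the last (z) axis
print(cond_given_z[:, :, 0])  # given Z = 0
print(cond_given_z[:, :, 1])  # given Z = 1
# (b) Check the factorization (17.1) for every (x, y, z).
f_x_given_z = joint.sum(axis=1) / p_z  # indexed [x, z]
f_y_given_z = joint.sum(axis=0) / p_z  # indexed [y, z]
product = np.einsum("xz,yz->xyz", f_x_given_z, f_y_given_z)
print(np.allclose(cond_given_z, product))  # True
# (c) Marginal distribution of (X, Y).
f_xy = joint.sum(axis=2)
print(f_xy)
# (d) X and Y are not marginally independent.
print(np.allclose(f_xy, np.outer(f_xy.sum(axis=1), f_xy.sum(axis=0))))  # False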
Consider the three DAGs in Figure 17.6 without a collider. Prove that $X \amalg Z \mid Y$.
Solution:
Visualizing the three DAGs:
from graphviz import Digraph
a = Digraph()
a.edge("X", "Y")
a.edge("Y", "Z")
a
b = Digraph()
b.edge("Z", "Y")
b.edge("Y", "X")
b
c = Digraph()
c.edge("Y", "X")
c.edge("Y", "Z")
c
Observe that in each of the three DAGs, the only path from $X$ to $Z$ passes through $Y$, and $Y$ is not a collider on that path in any of the DAGs. Conditioning on $Y$ therefore blocks the path, so in each DAG $X$ and $Z$ are d-separated given $Y$, and the result follows from Theorem 17.10.
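As an informal numerical illustration (not a proof), we can simulate the chain $X \to Y \to Z$ with arbitrarily chosen conditional probabilities and check that, within each stratum of $Y$, the distribution of $Z$ does not depend on $X$:
rng = np.random.default_rng(0)
n = 200_000
# Hypothetical CPDs for the chain X -> Y -> Z; the probabilities are arbitrary choices.
X = rng.binomial(1, 0.4, size=n)
Y = rng.binomial(1, np.where(X == 1, 0.8, 0.2))
Z = rng.binomial(1, np.where(Y == 1, 0.7, 0.1))
for y in [0, 1]:
    stratum = Y == y
    # P(Z = 1 | X = 0, Y = y) and P(Z = 1 | X = 1, Y = y) should be approximately equal.
    print(y, Z[stratum & (X == 0)].mean().round(3), Z[stratum & (X == 1)].mean().round(3))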
Consider the DAG in Figure 17.6 with a collider. Prove that $X \amalg Z$ and that $X$ and $Z$ are dependent given $Y$.
g = Digraph()
g.edge("X", "Y")
g.edge("Z", "Y")
g
Solution:
Since $Y$ is a collider and is not conditioned on, the only path between $X$ and $Z$ is blocked; hence $X$ and $Z$ are d-separated and, by Theorem 17.10, $X \amalg Z$. Conditioning on the collider $Y$, however, unblocks the path, so $X$ and $Z$ are d-connected given $Y$ and are therefore dependent given $Y$.
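Again as an informal check rather than a proof, simulating the collider $X \to Y \leftarrow Z$ (with an arbitrary mechanism for $Y$) shows $X$ and $Z$ essentially uncorrelated marginally but clearly correlated once we condition on $Y$:
rng = np.random.default_rng(1)
n = 200_000
X = rng.binomial(1, 0.5, size=n)
Z = rng.binomial(1, 0.5, size=n)
# Collider: Y depends on both X and Z (hypothetical mechanism).
Y = rng.binomial(1, expit(2 * (X + Z) - 2))
print(np.corrcoef(X, Z)[0, 1])                  # approximately 0
print(np.corrcoef(X[Y == 1], Z[Y == 1])[0, 1])  # clearly negative ("explaining away")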
Let $X \in \{0, 1\}$, $Y \in \{0, 1\}$, $Z \in \{0, 1, 2\}$. Suppose the distribution of $(X, Y, Z)$ is Markov to:
$$X \longrightarrow Y \longrightarrow Z$$Create a joint distribution $f(x, y, z)$ that is Markov to this DAG. Generate 1000 random vectors from this distribution. Estimate the distribution from the data using maximum likelihood. Compare the estimated distribution to the true distribution. Let $\theta = (\theta_{000}, \theta_{001}, \dots, \theta_{112})$ where $\theta_{rst} = \mathbb{P}(X=r, Y=s, Z=t)$. Use the bootstrap to get standard errors and 95 percent confidence intervals for these 12 parameters.
Solution:
A joint density that is Markov to this DAG must factor as:
$$f(x, y, z) = f(x) f(y \mid x) f(z \mid y)$$We define the conditional probabilities:
df = pd.DataFrame(
[
["X", None, 0, None, 0.3],
["X", None, 1, None, 0.7],
["Y", "X", 0, 0, 0.1],
["Y", "X", 1, 0, 0.9],
["Y", "X", 0, 1, 0.75],
["Y", "X", 1, 1, 0.25],
["Z", "Y", 0, 0, 0.3],
["Z", "Y", 1, 0, 0.3],
["Z", "Y", 2, 0, 0.4],
["Z", "Y", 0, 1, 0.8],
["Z", "Y", 1, 1, 0.1],
["Z", "Y", 2, 1, 0.1],
],
columns=[
"Variable",
"Conditioning Variable",
"Value of Variable",
"Value of Conditioning Variable",
"Probability",
],
)
def get_expression(row):
if row["Conditioning Variable"] is None:
return f"P({row['Variable']} = {row['Value of Variable']})"
else:
return f"P({row['Variable']} = {row['Value of Variable']} | {row['Conditioning Variable']} = {int(row['Value of Conditioning Variable'])})"
df["Expression"] = df.apply(
lambda row: get_expression(row),
axis=1,
)
df.set_index("Expression", inplace=True)
print(df["Probability"])
Expression
P(X = 0)            0.30
P(X = 1)            0.70
P(Y = 0 | X = 0)    0.10
P(Y = 1 | X = 0)    0.90
P(Y = 0 | X = 1)    0.75
P(Y = 1 | X = 1)    0.25
P(Z = 0 | Y = 0)    0.30
P(Z = 1 | Y = 0)    0.30
P(Z = 2 | Y = 0)    0.40
P(Z = 0 | Y = 1)    0.80
P(Z = 1 | Y = 1)    0.10
P(Z = 2 | Y = 1)    0.10
Name: Probability, dtype: float64
def get_prob(var=None, val=None, cond_var=None, cond_val=np.nan):
return df.query(
f"Variable == @var & `Value of Variable` == @val & (`Value of Conditioning Variable` == @cond_val | `Value of Conditioning Variable`.isna())"
)["Probability"].values[0]
Generating samples:
import numpy as np
np.random.seed(0)
N = 1000
X = np.random.choice(
[0, 1], size=N, replace=True, p=[get_prob("X", k) for k in [0, 1]]
)
Y_given_X_0 = np.random.choice(
[0, 1], size=N, replace=True, p=[get_prob("Y", k, "X", 0) for k in [0, 1]]
)
Y_given_X_1 = np.random.choice(
[0, 1], size=N, replace=True, p=[get_prob("Y", k, "X", 1) for k in [0, 1]]
)
Y = np.where(X, Y_given_X_1, Y_given_X_0)
Z_given_Y_0 = np.random.choice(
[0, 1, 2],
size=N,
replace=True,
p=[get_prob("Z", k, "Y", 0) for k in [0, 1, 2]],
)
Z_given_Y_1 = np.random.choice(
[0, 1, 2],
size=N,
replace=True,
p=[get_prob("Z", k, "Y", 1) for k in [0, 1, 2]],
)
Z = np.where(Y, Z_given_Y_1, Z_given_Y_0)
Estimating the distribution using maximum likelihood:
import pandas as pd
data = {}
for var_name, var in list(zip(["X", "Y", "Z"], [X, Y, Z])):
ks = [0, 1]
if var_name == "X":
cond_var = None
elif var_name == "Y":
cond_var = X
cond_var_name = "X"
else:
cond_var = Y
cond_var_name = "Y"
ks = [0, 1, 2]
for k in ks:
if cond_var is None:
mle = (var == k).mean()
data.update({f"P({var_name} = {k})": mle})
else:
for c in [0, 1]:
mle = (var[np.where(cond_var == c)[0]] == k).mean()
data.update(
{f"P({var_name} = {k} | {cond_var_name} = {c})": mle}
)
mle_df = pd.DataFrame.from_dict(data, orient="index")
mle_df.columns = ["MLE"]
df["MLE"] = mle_df
df[["Probability", "MLE"]]
Expression | Probability | MLE |
---|---|---|
P(X = 0) | 0.30 | 0.307 |
P(X = 1) | 0.70 | 0.693 |
P(Y = 0 | X = 0) | 0.10 | 0.101 |
P(Y = 1 | X = 0) | 0.90 | 0.899 |
P(Y = 0 | X = 1) | 0.75 | 0.746 |
P(Y = 1 | X = 1) | 0.25 | 0.254 |
P(Z = 0 | Y = 0) | 0.30 | 0.319 |
P(Z = 1 | Y = 0) | 0.30 | 0.319 |
P(Z = 2 | Y = 0) | 0.40 | 0.361 |
P(Z = 0 | Y = 1) | 0.80 | 0.816 |
P(Z = 1 | Y = 1) | 0.10 | 0.100 |
P(Z = 2 | Y = 1) | 0.10 | 0.084 |
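For a direct comparison of the joint distributions, we can also check the empirical joint frequencies against the true $\theta_{rst}$ implied by the factorization (a small sketch reusing get_prob and the simulated X, Y, Z above):
theta_true = np.zeros((2, 2, 3))
theta_emp = np.zeros((2, 2, 3))
for r in [0, 1]:
    for s in [0, 1]:
        for t in [0, 1, 2]:
            # theta_rst = P(X = r) P(Y = s | X = r) P(Z = t | Y = s)
            theta_true[r, s, t] = (
                get_prob("X", r)
                * get_prob("Y", s, "X", r)
                * get_prob("Z", t, "Y", s)
            )
            theta_emp[r, s, t] = np.mean((X == r) & (Y == s) & (Z == t))
print(np.abs(theta_true - theta_emp).max())  # maximum absolute discrepancy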
Using the bootstrap to get standard errors and 95 percent confidence intervals for these 12 parameters:
def get_mle(X, Y, Z):
result = np.zeros((2, 2, 3))
for r in [0, 1]:
for s in [0, 1]:
for t in [0, 1, 2]:
result[r, s, t] = sum((X == r) & (Y == s) & (Z == t)) / N
return result
B = 1000
theta_hat_boot = np.zeros((B, 2, 2, 3))
for b in tqdm(range(B)):
sample_indices = np.random.choice(range(N), size=N, replace=True)
X_sample = X[sample_indices]
Y_sample = Y[sample_indices]
Z_sample = Z[sample_indices]
theta_hat_boot[b] = get_mle(X_sample, Y_sample, Z_sample)
se = theta_hat_boot.std(axis=0)
theta_hat = get_mle(X, Y, Z)
theta_hat = np.ravel(theta_hat)
se = np.ravel(se)
df = pd.DataFrame(
{"Estimate": theta_hat, "LB": theta_hat - 2 * se, "UB": theta_hat + 2 * se}
)
df.index = [
    # label order must match np.ravel's C order: r slowest, t fastest
    f"theta_{r}{s}{t}" for r in [0, 1] for s in [0, 1] for t in [0, 1, 2]
]
df
Parameter | Estimate | LB | UB |
---|---|---|---|
theta_000 | 0.005 | 5.276e-04 | 0.009 |
theta_001 | 0.014 | 6.682e-03 | 0.021 |
theta_002 | 0.012 | 5.152e-03 | 0.019 |
theta_010 | 0.222 | 1.947e-01 | 0.249 |
theta_011 | 0.028 | 1.769e-02 | 0.038 |
theta_012 | 0.026 | 1.565e-02 | 0.036 |
theta_100 | 0.170 | 1.458e-01 | 0.194 |
theta_101 | 0.161 | 1.377e-01 | 0.184 |
theta_102 | 0.186 | 1.614e-01 | 0.211 |
theta_110 | 0.147 | 1.252e-01 | 0.169 |
theta_111 | 0.017 | 8.811e-03 | 0.025 |
theta_112 | 0.012 | 4.972e-03 | 0.019 |
Consider the DAG in Figure 17.12:
g = Digraph()
for k in [1, 2, 3, 4]:
g.edge("X", f"Y_{k}")
g.edge(f"Z_{k}", f"Y_{k}")
g
(a) Write down the factorization of the joint density.
Solution:
By Definition 17.3:
$$f(x,y_1,y_2,y_3,y_4, z_1, z_2, z_3, z_4) = f(x) \prod_{k=1}^4 \left[ f(z_k) f(y_k \mid x, z_k) \right].$$(b) Prove that $X \amalg Z_j$.
Solution:
Observe that the only undirected path from $X$ to $Z_j$ is via $Y_j$, and that $Y_j$ is a collider. Therefore, $X$ and $Z_j$ are d-separated. Thus the result holds by Theorem 17.10.
Let $V = (X, Y, Z)$ have the following joint distribution
$$ \begin{align*} X &\sim \text{Bernoulli}\left( \frac{1}{2} \right) \\ Y \mid X = x &\sim \text{Bernoulli} \left( \frac{e^{4x-2}}{1 + e ^ {4x - 2}}\right) \\ Z \mid X = x, Y = y &\sim \text{Bernoulli} \left( \frac{e^{2(x + y)-2}}{1 + e ^ {2(x + y) - 2}} \right). \end{align*} $$(a) Find an expression for $\mathbb{P}(Z = z \mid Y = y)$. In particular, find $\mathbb{P}(Z = 1 \mid Y = 1)$.
(b) Write a program to simulate the model. Conduct a simulation and compute $\mathbb{P}(Z = 1 \mid Y = 1)$ empirically. Plot this as a function of the simulation size $N$. It should converge to the theoretical value you computed in (a).
(c) (Refers to the material in the appendix.) Write down an expression for $\mathbb{P}(Z = 1 \mid Y := y)$. In particular, find $\mathbb{P}(Z = 1 \mid Y := 1)$.
(d) (Refers to the material in the appendix.) Modify your program to simulate the intervention "set $Y = 1$." Conduct a simulation and compute $\mathbb{P}(Z = 1 \mid Y := 1)$ empirically. Plot this as a function of the simulation size $N$. It should converge to the theoretical value you computed in (c).
Solution:
(a) Let $p_x = \text{expit}(x) = \exp(x) / (1 + \exp(x))$, and let $\alpha = p_2$ and $\beta = p_{-2}$. Then,
$$ \begin{align*} \mathbb{P}(X = x \mid Y = y) = \begin{cases} \alpha & y = x \\ \beta & y \ne x \end{cases} \end{align*} $$and
$$ \begin{align*} \mathbb{P}(Z = z \mid Y = y, X = x) = \begin{cases} \alpha & x = y = z\\ \beta & x = y, x \ne z \\ p_0 = 1/2 & y \ne x. \\ \end{cases} \end{align*} $$The probability function has the form $f(x, y, z) = f(x) f(y \mid x) f(z \mid x, y)$. Therefore,
$$ \begin{align*} \mathbb{P}(Z = z \mid Y = y) &= \frac{\mathbb{P}(Y = y, Z = z)}{\mathbb{P}(Y = y)} = \frac{f(y, z)}{f(y)} \\ &= \frac{\sum_x f(x, y, z)}{f(y)} = \frac{\sum_x f(x) f(y \mid x) f(z \mid x, y)}{f(y)} \\ &= \sum_x f(z \mid x, y) \frac{f(y \mid x) f(x)}{f(y)} = \sum_x f(z \mid x, y) \frac{f(x,y)}{f(y)} \\ &= \sum_x f(z \mid x, y) f(x \mid y) \end{align*} $$Thus,
$$ \begin{align*} \mathbb{P}(Z = z \mid Y = y) &= \sum_{x=0}^1 \mathbb{P}(Z = z \mid X = x, Y = y) \mathbb{P}(X = x \mid Y = y) \\ &= \begin{cases} \alpha^2 + \beta / 2 & z = 0, y = 0 \\ \alpha \beta + \beta / 2 & z = 1, y = 0 \\ \alpha \beta + \beta / 2 & z = 0, y = 1 \\ \alpha ^ 2 + \beta / 2 & z = 1, y = 1 \\ \end{cases} \\ &= \begin{cases} \alpha ^ 2 + \beta / 2 \approx 0.835 & z = y \\ \alpha \beta + \beta / 2 \approx 0.165 & z \ne y \\ \end{cases} \end{align*} $$So $\mathbb{P}(Z = 1 \mid Y = 1) \approx 0.835$.
(b) Conducting the simulation:
Ns = np.logspace(1, 6, 100, dtype=int)
theoretical_value = expit(2) * expit(2) + expit(0) * expit(-2)
empirical_values = {}
for N in Ns:
np.random.seed(0)
X = np.random.choice([0, 1], size=N, replace=True)
Y = np.where(np.random.uniform(size=N) < 1 / (1 + np.exp(2 - 4 * X)), 1, 0)
Z = np.where(
np.random.uniform(size=N) < 1 / (1 + np.exp(2 - 2 * (X + Y))), 1, 0
)
empirical_values[N] = Z[np.where(Y == 1)[0]].mean()
plt.plot(*zip(*sorted(empirical_values.items())), label="Empirical Value")
plt.hlines(
y=theoretical_value,
xmin=min(Ns),
xmax=max(Ns),
color="orange",
label="Theoretical Value",
)
plt.xscale("log")
plt.xlabel("N")
plt.grid()
plt.legend()
plt.title("P(Z = 1 | Y = 1)")
plt.show()
(c) We are now setting $Y = y$. This changes the joint probability to
$$f^*(x, z) = f(x) f(z \mid x, y)$$Therefore, the derivation of $\mathbb{P}(Z = z \mid Y := y)$ proceeds as in part (a), but yields:
$$ \begin{align*} \mathbb{P}(Z = z \mid Y := y) &= \sum_{x=0}^1 \mathbb{P}(Z = z \mid X = x, Y = y) P(X = x) \\ &= \begin{cases} \alpha / 2 + 1 / 4 & z = y \\ \beta / 2 + 1 / 4 & z \ne y \end{cases} \end{align*} $$Therefore,
$$ \begin{align*} \mathbb{P}(Z = 1 \mid Y := 1) &= \alpha / 2 + 1 / 4 \\ &\approx 0.690. \end{align*} $$(d) Modifying the simulation to force $Y = 1$:
Ns = np.logspace(1, 6, 100, dtype=int)
theoretical_value = expit(0) * expit(0) + expit(0) * expit(2)
empirical_values = {}
for N in Ns:
np.random.seed(0)
X = np.random.choice([0, 1], size=N, replace=True)
# Y = np.where(np.random.uniform(size=N) < 1 / (1 + np.exp(2 - 4 * X)), 1, 0)
Y = np.ones(shape=N)
Z = np.where(
np.random.uniform(size=N) < 1 / (1 + np.exp(2 - 2 * (X + Y))), 1, 0
)
empirical_values[N] = Z[np.where(Y == 1)[0]].mean()
plt.plot(*zip(*sorted(empirical_values.items())), label="Empirical Value")
plt.hlines(
y=theoretical_value,
xmin=min(Ns),
xmax=max(Ns),
color="orange",
label="Theoretical Value",
)
plt.xscale("log")
plt.xlabel("N")
plt.grid()
plt.legend()
plt.title("P(Z = 1 | Y := 1)")
plt.show()
This is a continuous, Gaussian version of the last question. Let $V = (X, Y, Z)$ have the following joint distribution
$$ \begin{align*} X &\sim \text{Normal}(0, 1) \\ Y \mid X = x &\sim \text{Normal}(\alpha x, 1) \\ Z \mid X = x, Y = y &\sim \text{Normal}(\beta y + \gamma x, 1) \end{align*} $$Here, $\alpha$, $\beta$ and $\gamma$ are fixed parameters. Economists refer to models like this as structural equation models.
(a) Find an explicit expression for $f(z \mid y)$ and $\mathbb{E}(Z \mid Y = y) = \int z f(z \mid y) \, dz$.
(b) (Refers to material in the appendix.) Find an explicit expression for $f(z \mid Y := y)$ and then find $\mathbb{E}(Z \mid Y := y) \equiv \int z f(z \mid Y := y) \, dz$. Compare to (a).
(c) Find the joint distribution of $(Y, Z)$. Find the correlation $\rho$ between $Y$ and $Z$.
(d) (Refers to material in the appendix.) Suppose that $X$ is not observed and we try to make causal conclusions from the marginal distribution of $(Y, Z)$. (Think of $X$ as unobserved confounding variables.) In particular, suppose we declare that $Y$ causes $Z$ if $\rho \ne 0$ and we declare $Y$ does not cause $Z$ if $\rho = 0$. Show that this will lead to erroneous conclusions.
(e) (Refers to material in the appendix.) Suppose we conduct a randomized experiment in which $Y$ is randomly assigned. To be concrete, suppose that
$$ \begin{align*} X & \sim \text{Normal}(0, 1) \\ Y & \sim \text{Normal}(\alpha, 1) \\ Z \mid X = x, Y = y & \sim \text{Normal}(\beta y + \gamma x, 1). \end{align*} $$Show that the method in (d) now yields correct conclusions (i.e., $\rho = 0$ if and only if $f(z \mid Y := y)$ does not depend on $y$).
Solution:
We first identify the joint distribution $f(x,y)$:
$$ \begin{align*} f(x, y) &= f(y \mid x) f(x) \\ &= \frac{1}{\sqrt{2 \pi}} \exp \left\{- \frac12 (y - \alpha x) ^ 2 \right\} \cdot \frac{1}{\sqrt{2 \pi}} \exp \left\{- \frac12 x ^ 2 \right\} \\ &= \frac{1}{2 \pi} \exp \left\{-\frac12 \left[ (y - \alpha x) ^2 + x^2 \right]\right\} \end{align*} $$Then $f(x,y,z)$:
$$ \begin{align*} f(x, y, z) &= f(z \mid x, y) f(x, y) \\ &= \frac{1}{\sqrt{2 \pi}} \exp \left\{- \frac{1}{2}\left(z - \beta y - \gamma x \right)^2 \right\} \cdot \frac{1}{2 \pi} \exp \left\{-\frac12 \left[ (y - \alpha x) ^2 + x^2 \right]\right\} \\ &= (2 \pi) ^ {-3 / 2} \exp \left\{- \frac{1}{2} \left[ \left(z - \beta y - \gamma x \right)^2 + \left[ (y - \alpha x) ^2 + x^2 \right] \right]\right\} \tag{*}\\ &= (2 \pi) ^ {-3 / 2} \left(\det \Sigma \right)^{-1/2} \exp \left\{- \frac{1}{2} (\mathbf{u} - \bm{\mu})^T \Sigma^{-1} (\mathbf{u} - \bm{\mu}) \right\} \end{align*} $$where
$$ \mathbf{u} = \begin{bmatrix} x \\ y \\ z \end{bmatrix}, \qquad \bm{\mu} = \begin{bmatrix} 0 \\ 0 \\ 0 \end{bmatrix}, \qquad \text{and} \qquad \Sigma = \begin{bmatrix} 1 & \alpha & \alpha \beta + \gamma\\\alpha & \alpha^{2} + 1 & \alpha^{2} \beta + \alpha \gamma + \beta\\\alpha \beta + \gamma & \alpha^{2} \beta + \alpha \gamma + \beta & \alpha^{2} \beta^{2} + 2 \alpha \beta \gamma + \beta^{2} + \gamma^{2} + 1 \end{bmatrix} $$We establish that $\bm{\mu}$ is the mean of the joint distribution by computing the marginal means: $\mathbb{E}[X] = 0$, $\mathbb{E}[Y] = \alpha \mathbb{E}[X] = 0$, and $\mathbb{E}[Z] = \beta \mathbb{E}[Y] + \gamma \mathbb{E}[X] = 0$.
We may show $\Sigma$ is the covariance matrix by expanding $\left(z - \beta y - \gamma x \right)^2 + (y - \alpha x) ^2 + x^2 = \sum_{i} c_{ii} u_i^2 + \sum_{i < j} c_{ij} u_i u_j$, where $u_1 = x$, $u_2 = y$, and $u_3 = z$. Defining the matrix $\Sigma^{-1}$ by
$$ \Sigma_{ij}^{-1} = \begin{cases} c_{ii} & i = j \\ c_{ij} / 2 & i \ne j, \end{cases} $$we may observe that $\left(z - \beta y - \gamma x \right)^2 + (y - \alpha x) ^2 + x^2 = (\mathbf{u} - \bm{\mu})^T \Sigma^{-1} (\mathbf{u} - \bm{\mu})$. $\Sigma$ is obtained by computing the inverse.
We may perform the algebra using sympy:
import sympy as sp
from IPython.display import display, Latex
x, y, z, alpha, beta, gamma = sp.symbols("x y z \\alpha \\beta \\gamma")
expression = (z - (beta * y + gamma * x)) ** 2 + (
(y - alpha * x) ** 2 + x**2
)
print("Original Expression:")
display(expression)
expanded = sp.collect(
sp.expand(expression), syms=[x, y, z, x * y, x * z, y * z]
)
print("Expanded Expression:")
display(expanded)
matrix = sp.Matrix(
[
[alpha**2 + gamma**2 + 1, (beta * gamma - alpha), -gamma],
[(beta * gamma - alpha), beta**2 + 1, -beta],
[-gamma, -beta, 1],
]
)
display(Latex("$\Sigma^{-1}$:"))
display(matrix)
display(Latex("$\Sigma$:"))
display(matrix.inv())
Original Expression:
Expanded Expression:
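As a numerical sanity check of $\Sigma$ (a sketch with arbitrarily chosen parameter values), the sample covariance matrix of draws simulated from the structural equations should approximate the matrix above:
# Arbitrary (hypothetical) values for alpha, beta, gamma.
a, b, c = 0.5, 1.0, -0.7
rng = np.random.default_rng(0)
n = 500_000
Xs = rng.normal(size=n)
Ys = a * Xs + rng.normal(size=n)
Zs = b * Ys + c * Xs + rng.normal(size=n)
Sigma_theory = np.array(
    [
        [1, a, a * b + c],
        [a, a**2 + 1, a**2 * b + a * c + b],
        [a * b + c, a**2 * b + a * c + b, a**2 * b**2 + 2 * a * b * c + b**2 + c**2 + 1],
    ]
)
print(np.round(np.cov(np.vstack([Xs, Ys, Zs])), 3))  # empirical covariance
print(np.round(Sigma_theory, 3))                     # theoretical covariance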
By Theorem 2.44(1), the marginal distribution of $(Y, Z)$ is $(Y, Z) \sim N(\mu_{Y, Z}, \Sigma_{Y,Z})$, where:
$$ \mu_{Y, Z} = \begin{bmatrix} 0 \\ 0 \end{bmatrix} \qquad \text{and} \qquad \Sigma_{Y,Z} = \begin{bmatrix} \alpha^{2} + 1 & \alpha^{2} \beta + \alpha \gamma + \beta\\ \alpha^{2} \beta + \alpha \gamma + \beta & \alpha^{2} \beta^{2} + 2 \alpha \beta \gamma + \beta^{2} + \gamma^{2} + 1 \end{bmatrix}. $$Then, by Theorem 2.44(2), the conditional distribution $Z \mid Y$ is $Z \mid Y \sim N(\mu_{Z \mid Y}, \Sigma_{Z \mid Y})$, where
$$ \begin{align*} \mu_{Z \mid Y} &= \mu_Z + \Sigma_{ZY}\Sigma_{YY}^{-1}(y - \mu_Y) \\ &= 0 + \frac{\alpha ^2 \beta + \alpha \gamma + \beta}{\alpha ^ 2 + 1}(y - 0) \\ &= \frac{\alpha (\alpha \beta + \gamma) + \beta}{\alpha^2 + 1} y \end{align*} $$and
$$ \begin{align*} \Sigma_{Z \mid Y} &= \Sigma_{ZZ} - \Sigma_{ZY} \Sigma_{YY}^{-1} \Sigma_{YZ} \\ &= \alpha^{2} \beta^{2} + 2 \alpha \beta \gamma + \beta^{2} + \gamma^{2} + 1 - (\alpha^{2} \beta + \alpha \gamma + \beta)^2 / (1 + \alpha^2) \\ &= \frac{\alpha ^2 + \gamma ^ 2 + 1}{\alpha ^ 2 + 1} \end{align*} $$We can verify the last simplification with sympy:
alpha, beta, gamma = sp.symbols("\\alpha \\beta \\gamma")
expression = (
(alpha**2) * (beta**2)
+ 2 * alpha * beta * gamma
+ beta**2
+ gamma**2
+ 1
- (((alpha**2) * beta + alpha * gamma + beta) ** 2 / (1 + alpha**2))
)
sp.simplify(expression)
The PDF is then:
$$ \begin{align*} f_{Z \mid Y}(z \mid y) = \frac{1}{\sqrt{2 \pi \Sigma_{Z \mid Y}}} \exp \left\{-\frac{\left(z - \mu_{Z \mid Y}\right)^2}{2 \Sigma_{Z \mid Y}} \right\}, \end{align*} $$and the mean is
$$\mu_{Z \mid Y} = \frac{\alpha (\alpha \beta + \gamma) + \beta}{\alpha^2 + 1} y.$$(b)
In this case, after setting $Y := y$, the post-intervention joint density of $(X, Z)$ is given by
$$ \begin{align*} f^*(x, z) &= f(z \mid x, y) f(x) \\ &= \frac{1}{\sqrt{2 \pi}} \exp \left\{-\frac{1}{2}\left(z - \beta y - \gamma x \right)^2 \right\} \cdot \frac{1}{\sqrt{2 \pi}} \exp \left\{- \frac{x^2}{2} \right\} \\ &= \frac{1}{2 \pi} \exp \left\{-\frac{1}{2}\left(z - \beta y - \gamma x \right)^2 - \frac{x^2}{2} \right\} \\ &= \frac{1}{2 \pi} \left( \det \Sigma_{X,Z} \right)^{-1 / 2} \exp \left\{-\frac{1}{2}(\bm{u} - \mu_{X, Z})^T \Sigma_{X,Z}^{-1} (\bm{u} - \mu_{X, Z}) \right\} \\ \end{align*} $$where
$$ \bm{u} = \begin{bmatrix} x \\ z \end{bmatrix} \qquad \qquad \mu_{X,Z} = \begin{bmatrix} 0 \\ \beta y \end{bmatrix} \qquad \text{and} \qquad \Sigma_{X,Z} = \begin{bmatrix} 1 & \gamma \\ \gamma & \gamma^2 + 1 \end{bmatrix}. $$This is established as follows. First, $\mu_{X, Z}$ is determined by computing the marginal means: $\mathbb{E}[X] = 0$ and $\mathbb{E}[Z] = \beta y$. Then, $\Sigma_{X,Z}$ is established by equating coefficients from the expanded vectorized expression
$$ \begin{align*} (\bm{u} - \mu_{X, Z})^T \Sigma_{X,Z}^{-1} (\bm{u} - \mu_{X, Z}) &= \Sigma_{X,Z;xx}^{-1} x^2 + 2\Sigma_{X,Z;xz}^{-1} x (z - \beta y) + \Sigma_{X,Z;zz}^{-1}(z - \beta y)^2 \end{align*} $$and the expanded original expression:
$$ \begin{align*} \left(z - \beta y - \gamma x \right)^2 + x^2 &= (\gamma ^2 + 1) x^2 - 2 \gamma x(z - \beta y) + (z - \beta y)^2. \end{align*} $$This yields
$$ \begin{align*} \Sigma_{X,Z}^{-1} = \begin{bmatrix} \gamma^2 + 1 & -\gamma \\ -\gamma & 1 \end{bmatrix}, \end{align*} $$and $\Sigma_{X,Z}$ is found by taking the inverse.
Under the intervention $Y := y$, the marginal distribution of $Z$ is $N(\beta y, \gamma^2 + 1)$, so $\mathbb{E}(Z \mid Y := y) = \beta y$. This matches the result in (a) when $\alpha = 0$; that is, setting $Y := y$ is equivalent to removing the influence of $X$ on $Y$.
(c) Computed in (a), $(Y, Z)$ is $(Y, Z) \sim N(\mu_{Y, Z}, \Sigma_{Y,Z})$, where:
$$ \mu_{Y, Z} = \begin{bmatrix} 0 \\ 0 \end{bmatrix} \qquad \text{and} \qquad \Sigma_{Y,Z} = \begin{bmatrix} \alpha^{2} + 1 & \alpha^{2} \beta + \alpha \gamma + \beta\\ \alpha^{2} \beta + \alpha \gamma + \beta & \alpha^{2} \beta^{2} + 2 \alpha \beta \gamma + \beta^{2} + \gamma^{2} + 1 \end{bmatrix}. $$From the covariance matrix, we get the correlation:
$$ \rho = \frac{\text{Cov}(Y,Z)}{\sigma_Y \sigma_Z} = \frac{\alpha^{2} \beta + \alpha \gamma + \beta}{\sqrt{(\alpha^{2} + 1)(\alpha^{2} \beta^{2} + 2 \alpha \beta \gamma + \beta^{2} + \gamma^{2} + 1)}}$$(d) Suppose $\alpha > 0$, $\beta = 0$ and $\gamma > 0$. Then $\text{Cov}(Y, Z) = \alpha \gamma > 0$, so $\rho > 0$ and the rule declares that $Y$ causes $Z$. However, since $\beta = 0$, $f(z \mid Y := y) = N(0, \gamma^2 + 1)$ does not depend on $y$: $Y$ has no influence on $Z$, so the conclusion is erroneous.
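To make (d) concrete, here is a small simulation sketch with hypothetical values $\alpha = 1$, $\beta = 0$, $\gamma = 1$: observationally $Y$ and $Z$ are clearly correlated, yet intervening on $Y$ leaves the distribution of $Z$ unchanged.
a, b, c = 1.0, 0.0, 1.0  # alpha, beta = 0 (no causal effect of Y on Z), gamma
rng = np.random.default_rng(0)
n = 500_000
Xs = rng.normal(size=n)
Ys = a * Xs + rng.normal(size=n)
Zs = b * Ys + c * Xs + rng.normal(size=n)
# Observational correlation: about alpha * gamma / sqrt((alpha^2 + 1)(gamma^2 + 1)) = 0.5 here.
print(round(np.corrcoef(Ys, Zs)[0, 1], 3))
# Intervention Y := y: overwrite Y but keep the structural equation for Z.
for y in [-2.0, 0.0, 2.0]:
    Z_do = b * y + c * Xs + rng.normal(size=n)
    print(y, round(Z_do.mean(), 3))  # mean of Z stays near 0 for every y, since beta = 0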
(e) In this case,
$$ \begin{align*} f(x, y, z) &= \frac{1}{\sqrt{2 \pi}} \exp\left\{-\frac{x^2}{2}\right\}\frac{1}{\sqrt{2 \pi}} \exp\left\{-\frac{(y - \alpha)^2}{2}\right\}\frac{1}{\sqrt{2 \pi}} \exp\left\{-\frac{(z - \beta y - \gamma x)^2}{2}\right\} \\ &= (2 \pi)^{-3/2} \exp \left\{-\frac{1}{2} \left( x^2 + (y - \alpha)^2 + (z - \beta y - \gamma x)^2\right) \right\} \end{align*} $$The marginal means are $\mathbb{E}[X] = 0$, $\mathbb{E}[Y] = \alpha$, and $\mathbb{E}[Z] = \alpha \beta$. Expanding the original and vectorized expressions:
$$ \begin{align*} (\bm{u} - \bm{\mu})^T \Sigma^{-1} (\bm{u} - \bm{\mu}) &= \Sigma_{xx}^{-1} x^2 + \Sigma_{xy}^{-1} 2x(y - \alpha) + \Sigma_{xz}^{-1} 2x(z - \alpha \beta) + \Sigma_{yy}^{-1} (y - \alpha)^2 + \Sigma_{yz}^{-1} 2(y - \alpha)(z - \alpha \beta) + \Sigma_{zz}^{-1} (z - \alpha \beta)^2 \end{align*} $$
x, y, z, alpha, beta, gamma = sp.symbols("x y z \\alpha \\beta \\gamma")
expr = (x**2) + (y - alpha) ** 2 + (z - beta * y - gamma * x) ** 2
sp.collect(
sp.expand(expr), [x, y, z, x * y, x * z, y * z, x**2, y**2, z**2]
)
and then matching coefficients of monomials $x^2, y^2, z^2, xy, xz, yz$, yields the precision matrix:
$$ \Sigma^{-1} = \begin{bmatrix} \gamma^2 + 1 & \beta \gamma & -\gamma \\ \beta \gamma & \beta^2 + 1 & -\beta \\ -\gamma & -\beta & 1\\ \end{bmatrix} $$with inverse:
$$ \Sigma = \begin{bmatrix} 1 & 0 & \gamma \\ 0 & 1 & \beta \\ \gamma & \beta & 1 + \beta ^ 2 + \gamma ^ 2\\ \end{bmatrix} $$Therefore,
$$ \begin{align*} f(x, y, z) &= (2 \pi)^{-3/2} \left( \det \Sigma \right)^{-1/2} \exp \left\{-\frac{1}{2}(\bm{u} - \mu)^T \Sigma^{-1} (\bm{u} - \mu) \right\} \\ \end{align*} $$where
$$ \bm{u} = \begin{bmatrix} x \\ y \\ z \end{bmatrix} \qquad \text{and} \qquad \mu = \begin{bmatrix} 0 \\ \alpha \\ \alpha \beta \end{bmatrix} $$By Theorem 2.44(1), the marginal $(Y,Z)$ is distributed as $N(\mu_{Y,Z}, \Sigma_{Y,Z})$, where:
$$ \mu_{Y,Z} = \begin{bmatrix} \alpha \\ \alpha \beta \end{bmatrix} \qquad \text{and} \qquad \Sigma_{Y,Z} = \begin{bmatrix} 1 & \beta \\ \beta & 1 + \beta ^ 2 + \gamma ^ 2\\ \end{bmatrix} $$From the covariance matrix, we get the correlation:
$$\rho = \frac{\text{Cov}(Y,Z)}{\sigma_Y \sigma_Z} = \frac{\beta}{\sqrt{1 + \beta^2 + \gamma^2}}.$$Observe that $\rho = 0 \iff \beta = 0$. Moreover, under the intervention, $Z \mid Y := y \sim N(\beta y, \gamma^2 + 1)$, so $f(z \mid Y := y)$ does not depend on $y$ if and only if $\beta = 0$. Hence $\rho = 0$ if and only if $f(z \mid Y := y)$ does not depend on $y$, and the method in (d) now yields correct conclusions.
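Finally, a brief simulation sketch of the randomized design in (e), again with hypothetical parameter values, confirms that the observational correlation now tracks the causal effect: it vanishes exactly when $\beta = 0$.
a, c = 0.5, -0.7  # alpha and gamma (arbitrary); compare beta = 0 versus beta = 1
rng = np.random.default_rng(0)
n = 500_000
for b in [0.0, 1.0]:
    Xs = rng.normal(size=n)
    Ys = a + rng.normal(size=n)  # Y is randomized: it no longer depends on X
    Zs = b * Ys + c * Xs + rng.normal(size=n)
    # Expected correlation: beta / sqrt(1 + beta^2 + gamma^2), i.e. 0 when beta = 0.
    print(b, round(np.corrcoef(Ys, Zs)[0, 1], 3))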