Lecture 8: When Are Instruments Strong? Understanding Stock & Yogo (2005)¶

Recap of Week 7¶

In Week 7 we derived the approximate bias of the 2SLS estimator:

$$ \text{E}(\hat{\beta}_{\text{2SLS}} - \beta) \;\approx\; \frac{L \cdot \rho}{F} $$

where $L$ is the number of instruments, $\rho$ is the degree of endogeneity $\text{Cov}(v_i, u_i)$, and $F$ is the population first-stage F-statistic. The key message: the larger the F, the smaller the bias. This motivates today's central question: how large does F need to be for instruments to be considered "strong"?
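To get a feel for the magnitudes this formula implies, here is a minimal numeric illustration (the parameter values below are hypothetical, chosen only to show how the bias scales with $F$):

# Hypothetical values of L, rho, and F, purely to illustrate the scale of the approximation
for (L, rho, F) in [(1, 0.5, 2.0), (1, 0.5, 10.0), (1, 0.5, 100.0)]
    println("L = ", L, ", rho = ", rho, ", F = ", F,
            "  =>  approximate 2SLS bias = ", round(L * rho / F, digits = 3))
end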

Staiger & Stock (1997) proposed the Rule of Thumb that a first-stage (sample) F above 10 qualifies instruments as strong. Stock & Yogo (2005) refined this into a set of critical values that depend on the model configuration. By the end of this notebook you will understand exactly where these numbers come from.

Road Map¶

  1. Specify a simulation DGP in which instrument strength is controlled by a population F parameter
  2. Simulate the distribution of the IV t-statistic under different DGPs and visually assess normality
  3. Formalise the problem via empirical size — the actual probability of a false rejection
  4. Use the noncentral $\chi^2$ distribution to convert population-F thresholds into practitioner-relevant sample-F critical values
  5. Evaluate whether Stock & Yogo's worst-case scenario ($\rho = 1$) is realistic in practice

Data Generating Process (DGP)¶

We use the toy model from Keane & Neal "A Practical Guide to Weak Instruments" (Annual Review of Economics, 2024), p. 193:

$$ \begin{align*} Y_i &= \beta X_i + u_i\\ X_i &= \pi Z_i + v_i\\ v_i &= \rho\, u_i + \sqrt{1-\rho^2}\, \eta_i \end{align*} $$

where

  • $u_i \sim N(0,1)$

  • $\eta_i \sim N(0,1)$

  • $Z_i \sim N(0,1)$

  • $\beta = 0$

  • notice: $\sigma_v^2 = \operatorname{Var}(v_i) = 1$

Parameter $\rho$ controls the OLS bias (aka the degree of endogeneity):

$$ \operatorname{Cov}(u_i, v_i) = \operatorname{E}(u_i v_i) = \operatorname{E}(\rho u_i^2) + \operatorname{E}(\sqrt{1-\rho^2}\, u_i \eta_i) = \rho \operatorname{E}(u_i^2) = \rho $$

For small values of $\pi$, the value of $\rho$ pins down the OLS bias:

$$ \hat{\beta}_\text{OLS} - \beta = \frac{\sum X_i u_i}{\sum X_i^2} = \frac{\sum (\pi Z_i + v_i) u_i}{\sum (\pi Z_i + v_i)^2} \;\to_p\; \frac{\operatorname{E}(u_i v_i)}{\pi^2 \operatorname{Var}(Z_i) + \operatorname{Var}(v_i)} = \frac{\rho}{\pi^2 + 1} \approx \rho, $$

when $\pi$ is small.
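A self-contained Monte Carlo sketch (with an illustrative small $\pi$ and moderate $\rho$) confirms this limit:

using Random, Statistics

Random.seed!(1)
n, piv, rho = 10^6, 0.05, 0.5                  # illustrative values; piv plays the role of a small pi
u   = randn(n); eta = randn(n); z = randn(n)
v   = rho .* u .+ sqrt(1 - rho^2) .* eta
x   = piv .* z .+ v
y   = u                                        # beta = 0, so y = u

bols = sum(x .* y) / sum(x .^ 2)               # OLS slope in the no-intercept regression of y on x
println("OLS slope        = ", round(bols, digits = 3))
println("rho / (pi^2 + 1) = ", round(rho / (piv^2 + 1), digits = 3))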

Parameter $\pi$ governs instrument strength and is set indirectly via the population F-statistic. Recall from Week 7 (and equation 11 of Keane & Neal):

$$ F = N \cdot \frac{R^2}{1-R^2} = N \cdot \frac{\text{ESS}}{\text{RSS}} = N \cdot \frac{\text{Var}(Z\pi)}{\sigma_v^2} = N \cdot \frac{\pi^2 \text{Var}(Z)}{\sigma_v^2} = N \cdot \pi^2 $$

(using $\operatorname{Var}(Z)=1$ and $\sigma_v^2=1$). Therefore $\pi = \sqrt{F/N}$, which enables us to set $\pi$ in the above DGP by changing the value of $F$.
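As a quick check of this mapping, the three population-F values used later in this lecture translate into the following first-stage coefficients at $n = 1{,}000$:

n = 1000
for F in (1.82, 2.30, 73.75)
    piv = sqrt(F / n)
    println("F = ", F, "  =>  pi = ", round(piv, digits = 4),
            "   (check: N * pi^2 = ", round(n * piv^2, digits = 2), ")")
end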

Julia Functions¶

The cells below define the simulation machinery used throughout this lecture. Each function is self-contained with its own docstring. Feel free to skim them now and refer back as needed.

In [1]:
using Distributions, Random, Statistics

function dgp_keane_neal(; b=0, n=1000, F, rho)

    """
    Generates one sample of size n following the DGP of Keane & Neal (2024) p. 193.

    ### Input
    - `b`   -- structural coefficient β (default 0)
    - `n`   -- sample size (default 1000)
    - `F`   -- population first-stage F-statistic
    - `rho` -- degree of endogeneity ρ

    ### Output (named tuple)
    - `x`, `y`, `z` -- (n×1) vectors for regressor, outcome, and instrument
    """

    π   = sqrt(F / n)
    u   = randn(n)
    eta = randn(n)
    z   = randn(n)
    v   = rho * u + sqrt(1 - rho^2) * eta
    x   = π * z .+ v
    y   = b * x .+ u

    return (; x, y, z)

end
Out[1]:
dgp_keane_neal (generic function with 1 method)
In [2]:
function ols_estimator(x, y)

    """
    OLS estimator for the simple linear model y = βx + u.

    ### Input
    - `x` -- (n×1) regressor vector
    - `y` -- (n×1) outcome vector

    ### Output (named tuple)
    - `bhat` -- OLS estimate of β
    - `se`   -- standard error
    - `t`    -- t-statistic
    """

    bhat = x \ y
    uhat = y - x * bhat
    s    = (uhat' * uhat) / length(y)
    se   = sqrt(s / (x' * x))
    t    = bhat / se

    return (; bhat, se, t)

end
Out[2]:
ols_estimator (generic function with 1 method)
In [3]:
function iv_estimator(x, y, z)

    """
    Just-identified IV estimator with one endogenous variable and one instrument.

    ### Input
    - `x` -- (n×1) endogenous regressor
    - `y` -- (n×1) outcome vector
    - `z` -- (n×1) instrument vector

    ### Output (named tuple)
    - `bhat` -- IV estimate of β
    - `se`   -- standard error (Keane & Neal 2024, p. 190)
    - `t`    -- t-statistic

    ### Notes
    The SE uses the first-stage ESS = N·π̂²·Var(z) as the relevance measure.
    """

    bhat  = (z' * y) / (z' * x)   # β̂_IV = (z'y)/(z'x)

    n     = length(y)
    pihat = z \ x                  # first-stage coefficient π̂
    ESS   = n * pihat^2 * var(z)   # first-stage explained sum of squares
    uhat  = y - x * bhat
    s     = (uhat' * uhat) / n
    se    = sqrt(s / ESS)

    t = bhat / se

    return (; bhat, se, t)

end
Out[3]:
iv_estimator (generic function with 1 method)
In [4]:
function simulate_distribution(; b=0, F, rho, n=1000, rep=10000)

    """
    Monte Carlo simulation of OLS and IV estimator distributions.

    Creates `rep` independent datasets from dgp_keane_neal and collects
    estimates, standard errors, and t-statistics for OLS, IV, and the
    Anderson-Rubin (AR) test.

    ### Input
    - `b`   -- true structural coefficient β (default 0)
    - `F`   -- population first-stage F-statistic
    - `rho` -- degree of endogeneity ρ
    - `n`   -- sample size (default 1000)
    - `rep` -- number of Monte Carlo replications (default 10,000)

    ### Output (named tuple of rep-length vectors)
    - `bols_dst`, `sols_dst`, `tols_dst` -- OLS estimate, SE, t-statistic
    - `biv_dst`,  `siv_dst`,  `tiv_dst`  -- IV  estimate, SE, t-statistic
    - `ar_dst`                            -- AR t-statistic (OLS of Y on Z)
    """

    bols_dst = Vector{Float64}(undef, rep)
    sols_dst = Vector{Float64}(undef, rep)
    tols_dst = Vector{Float64}(undef, rep)
    biv_dst  = Vector{Float64}(undef, rep)
    siv_dst  = Vector{Float64}(undef, rep)
    tiv_dst  = Vector{Float64}(undef, rep)
    ar_dst   = Vector{Float64}(undef, rep)

    for i in 1:rep
        x, y, z = dgp_keane_neal(b=b, F=F, rho=rho, n=n)

        bols_dst[i], sols_dst[i], tols_dst[i] = ols_estimator(x, y)
        biv_dst[i],  siv_dst[i],  tiv_dst[i]  = iv_estimator(x, y, z)
        ar_dst[i] = ols_estimator(z, y).t   # AR: regress Y on Z directly
    end

    return (; bols_dst, sols_dst, tols_dst, biv_dst, siv_dst, tiv_dst, ar_dst)

end
Out[4]:
simulate_distribution (generic function with 1 method)
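Before running the full Monte Carlo, here is a quick sanity check of the machinery. It draws one strong-instrument sample and applies the estimators defined above (the seed is illustrative and separate from the seeds used below):

Random.seed!(42)                                  # illustrative seed
x, y, z = dgp_keane_neal(F = 73.75, rho = 0.5)    # strong-instrument case

ols = ols_estimator(x, y)                         # should be biased: roughly rho/(pi^2 + 1) ≈ 0.47 here
iv  = iv_estimator(x, y, z)                       # should be close to the true beta = 0
fs  = ols_estimator(z, x)                         # first stage: regression of x on z

println("OLS estimate = ", round(ols.bhat, digits = 3))
println("IV  estimate = ", round(iv.bhat, digits = 3))
println("sample F     = ", round(fs.t^2, digits = 1), "  (should be in the vicinity of 73.75)")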

Creating Simulated Distributions¶

We explore nine parameter combinations that vary instrument strength and the degree of endogeneity:

| DGP | Population F | $\rho$ | Description |
|-----|--------------|--------|-------------|
| 1 | 1.82 | 0.10 | weak IV, low endogeneity |
| 2 | 2.30 | 0.10 | rule of thumb IV, low endogeneity |
| 3 | 73.75 | 0.10 | strong IV, low endogeneity (benchmark) |
| 4 | 1.82 | 0.50 | weak IV, moderate endogeneity |
| 5 | 2.30 | 0.50 | rule of thumb IV, moderate endogeneity |
| 6 | 73.75 | 0.50 | strong IV, moderate endogeneity |
| 7 | 1.82 | 0.90 | weak IV, high endogeneity |
| 8 | 2.30 | 0.90 | rule of thumb IV, high endogeneity |
| 9 | 73.75 | 0.90 | strong IV, high endogeneity |

Why these specific F values? The three F values correspond to Stock & Yogo critical values we will derive later in this notebook:

| Population F | Sample F (95th pct) | Worst-case empirical size |
|--------------|---------------------|---------------------------|
| 1.82 | ≈ 8.96 | 15% |
| 2.30 | 10.00 | 13.5% (Rule of Thumb) |
| 73.75 | ≈ 104.70 | ≈ 5% (nominal level) |

DGPs 3, 6, 9 serve as our benchmark: they represent how things should look when instruments are strong.

For each of the nine DGPs we generate 10,000 samples of size $n = 1{,}000$.

In [5]:
Random.seed!(1234)   # set seed for reproducibility

parms_rho = (0.10, 0.50, 0.90)
parms_F   = (1.82, 2.30, 73.75)

dgps = [simulate_distribution(rho=rho, F=F) for rho in parms_rho, F in parms_F];

Distribution of the IV t-Statistic¶

We plot the empirical distribution of the IV t-statistic across all nine DGPs.

Under standard regularity conditions, the IV t-statistic $t_{\text{IV}} = \hat{\beta}_{\text{IV}} / \text{se}_{\text{IV}}$ converges to $N(0,1)$. The solid curve in each panel below shows that $N(0,1)$ density as a reference. The histograms are normalised to density so that they are comparable to this curve.

Question to keep in mind: Do all nine distributions look approximately normal?

In [6]:
using Plots, LaTeXStrings
using Plots.PlotMeasures: mm
Plots.theme(:wong2)
gr(fmt=:png)

# ── Global defaults (apply to all subsequent plots) ──
default(
    fontfamily    = "Computer Modern",
    titlefontsize = 13,
    guidefontsize = 11,
    tickfontsize  = 9,
    legendfontsize = 9,
    left_margin   = 12mm,
    bottom_margin = 10mm,
    gridalpha     = 0.15,
    framestyle    = :box,
    lw            = 2,
    size          = (900, 500)
)

xgrid = range(-4, 4, length=200)

plt = plot(layout=(length(parms_rho), length(parms_F)),
    size=(1000, 700),
    plot_title="Empirical Distribution of IV t-statistic for Different DGPs",
    plot_titlefontsize=14)

for (i, rho) in enumerate(parms_rho)
    for (j, F) in enumerate(parms_F)
        k = length(parms_F) * (i-1) + j
        histogram!(plt,
            dgps[i,j].tiv_dst,
            normalize=true,
            subplot=k,
            bins=range(-4, 4, length=51),
            color="#6C9BC2",
            fillalpha=0.5,
            linecolor=:white,
            linewidth=0.5,
            legend=false,
            title=L"\rho=%$(rho),\; F=%$(F)",
            titlefontsize=10)
        plot!(plt, xgrid, pdf.(Normal(0,1), xgrid),
            subplot=k, lc="#0072B2", lw=2, label=false)
    end
end

display(plt)

Reading the Plots¶

The solid line is the $N(0,1)$ density — the ideal target.

Top row ($\rho = 0.10$): The top-right panel (strong IV, $F = 73.75$) is our benchmark. It tracks the $N(0,1)$ density closely. The top-left and top-centre panels deviate modestly.

Middle and bottom rows ($\rho = 0.50$ and $\rho = 0.90$): As endogeneity increases, departures from normality worsen. The bottom-left panels show heavy tails.

Why does this matter? When we report significance at the "5% level", we compare $|t_{\text{IV}}|$ to 1.96, which is the 97.5th percentile of $N(0,1)$. If the actual distribution of $t_{\text{IV}}$ is not $N(0,1)$, this comparison is unreliable — we might reject the null far more (or less) often than we intend.

Empirical Size and the Stock & Yogo (2005) Approach¶

Formalising the Problem¶

Empirical size is the actual probability of rejecting a true null hypothesis:

$$ \text{empirical size} := \Pr\!\left(|t_{\text{IV}}| > 1.96 \;\Big|\; \beta = 0\right) $$

In our DGP we set $\beta = 0$, so every rejection is a false rejection (Type I error). The nominal size is 5%. If the empirical size exceeds 5%, our test rejects too often — we are over-confident in declaring effects "significant".

We can estimate empirical size directly from our simulations: it is simply the fraction of the 10,000 replications for which $|t_{\text{IV}}| > 1.96$.
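A short loop (a sketch reusing the dgps array and parameter tuples created above) tabulates this fraction for every DGP:

# Empirical size of the IV t-test for each DGP (rows: rho; columns: population F = 1.82, 2.30, 73.75)
for (i, rho) in enumerate(parms_rho)
    sizes = [mean(abs.(dgps[i, j].tiv_dst) .> 1.96) for j in 1:length(parms_F)]
    println("rho = ", rho, ":  ", join(round.(sizes, digits = 3), "   "))
end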

Stock & Yogo's Strategy¶

Stock and Yogo (2005) propose the following approach to formalise when instruments are "strong enough":

  1. Fix $\rho = 1$ — the worst case for endogeneity (OLS bias equals its maximum possible value).
  2. Vary the population F over a grid from 0 to 20.
  3. For each F, simulate the empirical size.
  4. Declare instruments "strong" if F exceeds the threshold at which empirical size stays below a chosen tolerance $\alpha^*$ (e.g. 15% or 10%).

By conditioning on the worst case $\rho = 1$, the threshold is conservative: if your instruments pass this test, they pass under any smaller $\rho$ too.

Let's run the simulation:

In [7]:
Random.seed!(2024)

F_range  = 0:.25:20
emp_size = [mean(abs.(simulate_distribution(F=F, rho=1).tiv_dst) .> 1.96) for F in F_range]

plot(F_range, emp_size,
    legend=false,
    xlabel=L"Population $F$",
    ylabel="Empirical Size",
    xticks=0:2:20,
    yticks=0:0.05:1,
    size=(900, 500),
    lw=2.5,
    lc="#0072B2")
hline!([0.15], linestyle=:dash, lc="#009E73", lw=1.5)
hline!([0.05], linestyle=:dash, lc="#009E73",  lw=1.5)
ylims!(0, 1)
title!(L"Empirical Size of IV $t$-test vs Population $F$ (worst case: $\rho$ = 1)")
Out[7]:

Reading the Size Plot¶

When population F is large (above ≈ 20), the empirical size approaches the 5% nominal level even under the extreme assumption $\rho = 1$.

For weaker instruments:

  • At $F \approx 2.30$, the empirical size is roughly 13.5% — you falsely reject the null about 2.7 times as often as you should.
  • At $F \approx 1.82$, it reaches roughly 15% — a three-fold inflation.

Stock & Yogo's Threshold Rule¶

Stock and Yogo accept that with weak instruments the empirical size cannot be held at 5%. Instead, they ask:

"What is the minimum population F that keeps the worst-case empirical size below a tolerance $\alpha^$?"*

Common choices for $\alpha^*$: 10% or 15%.

Digression: Population F vs Sample F¶

For practitioners, the question is more naturally framed in terms of the sample F (the quantity actually reported in software) rather than the population F. We now relate these two to each other.

Recall: population $F$ is given by $F = N \pi^2$ (see equation 11 in Keane & Neal).

In applications, the first stage $F$ is estimated via $\widehat{F} := t^2 = \left( \frac{\widehat{\pi}}{\text{se}(\widehat{\pi})} \right)^2 = \frac{\widehat{\pi}^2}{\widehat{\operatorname{Var}}(\widehat{\pi})} = \frac{\widehat{\pi}^2}{\widehat{\sigma}^2_v/(N \cdot \widehat{\sigma}^2_Z)} =N \widehat{\pi}^2 \frac{\widehat{\sigma}^2_Z}{\widehat{\sigma}^2_v}$. This is the sample F.
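A one-sample check, reusing dgp_keane_neal and ols_estimator from above with illustrative parameter values, confirms that the squared first-stage t-statistic coincides with $N \widehat{\pi}^2 \widehat{\sigma}^2_Z / \widehat{\sigma}^2_v$:

Random.seed!(7)                                    # illustrative seed
x, y, z = dgp_keane_neal(F = 10.0, rho = 0.5)      # rho plays no role in the first stage

fs    = ols_estimator(z, x)                        # first-stage regression of x on z
sigz2 = mean(z .^ 2)                               # uncentred, matching the no-intercept regressions above
sigv2 = mean((x .- fs.bhat .* z) .^ 2)             # variance of the first-stage residuals

println("t^2 from the first stage    = ", round(fs.t^2, digits = 3))
println("N * pihat^2 * sigz2 / sigv2 = ", round(length(x) * fs.bhat^2 * sigz2 / sigv2, digits = 3))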

It can be shown that the distribution of $\widehat{F}$ relates to $F$ as follows: $\widehat{F} \to_d \chi_1^2(F)$, which is the so-called noncentral $\chi^2$ distribution with noncentrality parameter $F$. Here is an explanation:

Primer: Central $\chi^2_1$¶

If $Z \sim N(0, 1)$, then

$$Z^2 \sim \chi^2_1$$

This has mean $1$ and variance $2$. It describes the distribution of a squared standard normal — pure noise centered at zero, then squared.

Key properties:

  • Supported on $[0, \infty)$
  • Heavily right-skewed
  • If $Q_1 \sim \chi^2_1$ and $Q_2 \sim \chi^2_1$ are independent, then $Q_1 + Q_2 \sim \chi^2_2$ (this is how the general $\chi^2_k$ is built up)

Primer: Noncentral $\chi^2_1$¶

Now suppose $Z$ has a nonzero mean: $Z \sim N(\mu, 1)$. Then

$$Z^2 \sim \chi^2_1(\lambda), \qquad \lambda = \mu^2$$

where $\lambda$ is the noncentrality parameter. It measures how far the mean is from zero.

Key properties:

  • Mean is $1 + \lambda$ (shifted right by $\lambda$ compared to the central case)
  • Variance is $2(1 + 2\lambda)$
  • When $\lambda = 0$, this reduces to the ordinary $\chi^2_1$
  • Larger $\lambda$ shifts the entire distribution to the right

Quick visual intuition¶

|  | Mean zero ($\mu = 0$) | Mean nonzero ($\mu \neq 0$) |
|---|---|---|
| $Z \sim N(\mu, 1)$ | Centered at 0 | Shifted right |
| $Z^2 \sim \;?$ | $\chi^2_1$ (central) | $\chi^2_1(\mu^2)$ (noncentral) |

Squaring a shifted normal gives you a "shifted" $\chi^2$. That's the entire idea.
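To connect the primer back to the claim that $\widehat{F} \to_d \chi^2_1(F)$, here is a quick Monte Carlo sketch (population F, ρ, and seed are illustrative) comparing simulated sample-F draws with the corresponding NoncentralChisq(1, F) distribution from Distributions.jl:

Random.seed!(99)                                     # illustrative seed
F_pop, rep = 2.30, 10_000

# one draw of the sample F: squared t-statistic of the first-stage regression of x on z
sample_F(F) = (s = dgp_keane_neal(F = F, rho = 0.5); ols_estimator(s.z, s.x).t^2)

Fhat = [sample_F(F_pop) for _ in 1:rep]              # rho does not affect the first stage
d    = NoncentralChisq(1, F_pop)

println("mean:     simulated = ", round(mean(Fhat), digits = 2),
        "   theoretical 1 + F = ", 1 + F_pop)
println("95th pct: simulated = ", round(quantile(Fhat, 0.95), digits = 2),
        "   theoretical = ", round(quantile(d, 0.95), digits = 2))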

In [8]:
# Under the DGP, sample F follows a noncentral χ²(1, μ) distribution
# with noncentrality parameter μ = population F.
# We plot the CDFs to read off the 95th percentile of sample F for each population F.

popF_values = [1.82, 2.30, 5.78, 10.00, 29.44, 73.75]
linewidths  = [1.5,  2.5,  1.5,  1.5,   1.5,   1.5]

plt_nc = plot(
    size=(900, 500),
    legend=:bottomright,
    xticks=0:10:120,
    title=L"Noncentral $\chi_1^2(\mu)$: CDF of $\widehat{F}$ for Various Population $F$ Values",
    xlabel=L"Sample $\widehat{F}$",
    ylabel="CDF")

for (μ, lw) in zip(popF_values, linewidths)
    plot!(plt_nc, x -> cdf(NoncentralChisq(1, μ), x), 0, 120,
        label=L"$F = %$(μ)$", lw=lw)
end

hline!([0.95], linestyle=:dash, lc=:gray50, lw=1.2, label=false)
vline!([10],   linestyle=:dash, lc=:gray50, lw=1.2, label=false)
annotate!(65, 0.91, text("95th percentile", 9, :gray40))
annotate!(11.5, 0.15, text(L"$\widehat{F} = 10$", 9, :gray40))

display(plt_nc)

Reading the Noncentral $\chi^2$ Plot¶

How do we read the above picture?

Let's focus on the slightly thicker line for which population F is equal to 2.30.

That line gives the CDF of the noncentral $\chi^2$ distribution with noncentrality parameter 2.30. It crosses the dashed horizontal line at 0.95 at roughly $\widehat{F} = 10$.

In words: if the population $F$ is 2.30, then 95% of sample $F$ values should fall below 10.

Loose translation: if the population $F$ is 2.30, then it is unlikely that the sample $F$ exceeds 10.

Contrapositive: if the sample $F$ exceeds 10, then the associated population $F$ is probably not 2.30 but something larger.

This gives a simple, intuitive construction of a confidence interval for the population $F$:

A sample $F$ of 10 implies the one-sided confidence interval $F > 2.30$, which in turn implies a worst-case empirical size of at most 13.5%.

Mapping from population F to sample F:

| Case | Population F | Sample F (95th pct) | Worst-case empirical size (when $\rho=1$) |
|------|--------------|---------------------|-------------------------------------------|
| 1 | 1.82 | 8.96 | 15% |
| 2 | 2.30 | 10.00 | 13.5% |
| 3 | 5.78 | 16.38 | 10% |
| 4 | 10.00 | 23.10 | 8.6% |
| 5 | 29.44 | 50.00 | 6.4% |
| 6 | 73.75 | 104.70 | 5.0% |

Bottom line for practitioners:

If we want to be confident that the worst-case empirical size will not exceed 15%, check that the first-stage (sample) F exceeds 8.96.

(This is the origin of the Rule of Thumb that the sample F should exceed 10.)

The table also shows that if you strive for an empirical size of 5%, you need a sample F of about 104.7.

(Source: Table 1 of Keane & Neal 2024, which tabulates Stock & Yogo critical values.)
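The sample-F column of the table can be reproduced directly from the quantile function of the noncentral $\chi^2$ distribution (a sketch; the numbers should agree with the table up to rounding):

# Reproduce the "Sample F (95th pct)" column from the noncentral chi-squared quantile function
for F in (1.82, 2.30, 5.78, 10.00, 29.44, 73.75)
    println("population F = ", rpad(F, 6),
            "  =>  95th pct of sample F ≈ ", round(quantile(NoncentralChisq(1, F), 0.95), digits = 2))
end

# The reverse mapping behind the confidence-interval argument: the smallest population F
# whose 95th percentile of sample F reaches 10 (coarse grid search, illustrative)
println("population F with 95th pct = 10:  ",
        round(first(F for F in 0:0.01:5 if quantile(NoncentralChisq(1, F), 0.95) >= 10), digits = 2))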

Practical implications:

  • The Staiger & Stock Rule of Thumb (sample F > 10) corresponds to a worst-case empirical size of ≈ 13.5%, not 5%. It is a lower bound, not a gold standard.
  • Achieving a worst-case size close to the 5% nominal level requires sample F above 104.7 — a much more demanding criterion that many published studies cannot meet.
  • Keane & Neal (2024) recommend always reporting the first-stage sample F and being transparent about what size distortion it implies.

Is the Worst Case too Pessimistic?¶

Stock & Yogo fix $\rho = 1$ to derive conservative thresholds. How realistic is this assumption?

A back-of-the-envelope calculation from Keane & Neal, using US Panel Study of Income Dynamics data on returns to schooling:

  • The sample correlation between log earnings and years of schooling is about 0.45.
  • This correlation has two components: the causal effect of schooling on earnings, and the confounding effect of unobserved ability.
  • In the extreme case in which the causal effect is zero, the entire 0.45 correlation would reflect ability bias — so $|\rho| \leq 0.45$.
  • In practice, the causal effect is positive, so $|\rho|$ must be well below 0.45.

Under this reasoning, $\rho = 1$ is an extreme and unrealistic scenario for most applications.

Does this mean Stock & Yogo are needlessly conservative?
Let's check directly: holding $F = 1.82$ fixed (the weak-instrument case that maps to sample F ≈ 8.96), how does empirical size vary as $\rho$ changes?

In [9]:
Random.seed!(5678)

rho_range = 0:0.05:1.0
emp_size  = [mean(abs.(simulate_distribution(F=1.82, rho=rho).tiv_dst) .> 1.96) for rho in rho_range]

plot(rho_range, emp_size,
    lw=2.5,
    lc="#0072B2",
    legend=false,
    xlabel=L"Degree of Endogeneity $\rho$",
    ylabel="Empirical Size",
    size=(900, 500))
hline!([0.05], linestyle=:dash, lc=:black, lw=1.2)
annotate!(0.12, 0.058, text("5% nominal size", 9, :gray40))
vline!([0.45], linestyle=:dot, lc="#009E73", lw=2)
annotate!(0.51, 0.21, text(L"\rho = 0.45", 10, "#009E73"))
ylims!(0, 0.22)
title!(L"Empirical Size vs $\rho$ (population $F$ = 1.82, sample $\widehat{F}$ 95th pct $\approx$ 8.96)")
Out[9]:

What Does This Tell Us?¶

The plot reveals a nuanced picture:

  • At $\rho = 1$ (worst case): empirical size peaks around 15% — consistent with the Stock & Yogo table entry for $F = 1.82$.
  • At $\rho \approx 0.45$ (realistic maximum in returns-to-schooling): empirical size is only around 5–6%, close to the nominal level.
  • At very low $\rho$: empirical size can fall below 5%. This is not entirely reassuring — a test that under-rejects is conservative but hints that the IV estimator behaves oddly even when endogeneity is mild.

Bottom line: Stock & Yogo's $\rho = 1$ benchmark is deliberately conservative. In many empirical settings the true degree of endogeneity is moderate, and the size distortion is less severe than the worst case suggests. This does not mean we can ignore instrument strength — a sample F just above 10 still warrants caution — but it does mean the picture is more nuanced than a single threshold implies.

Summary and Preview of Week 9¶

| Concept | Key Result |
|---------|------------|
| 2SLS bias (Week 7) | $\propto L\rho/F$ — large $F$ suppresses bias |
| Empirical size | Inflated above 5% when $F$ is small; worst case at $\rho=1$ |
| Rule of Thumb | Sample $F > 10$ $\Leftrightarrow$ pop. $F > 2.30$ $\Leftrightarrow$ worst-case size ≈ 13.5% |
| Worst-case realism | $\rho=1$ is conservative; realistic $\rho$ values give better size properties |

What's missing from this analysis? We have only studied size — what happens when the null $H_0: \beta = 0$ is true. We have not studied power — the probability of correctly rejecting a false null when the true effect is non-zero. In Week 9 we will see that:

  • Weak instruments also dramatically reduce statistical power, so even when size is acceptable, you may miss genuine effects.
  • There is an additional problem: the standard IV t-test suffers from power asymmetry — it is easier to find "significant" results in one direction than the other when instruments are weak.
  • The Anderson–Rubin (AR) test provides a simple, robust alternative that Keane & Neal (2024) recommend over the standard IV t-test.