!pip install -q numpy pandas statsmodels scipy matplotlib

# Array math / random draws (numpy) and tabular containers (pandas).
import numpy as np, pandas as pd
# statsmodels supplies add_constant, OLS and the f_test used below.
import statsmodels.api as sm
# scipy.stats supplies the t, normal and F distributions used below.
from scipy import stats
import matplotlib.pyplot as plt
# Seed NumPy's global RNG so the np.random.normal draws below are reproducible.
np.random.seed(320)

[notice] A new release of pip is available: 25.2 -> 25.3
[notice] To update, run: pip install --upgrade pip

# Visual demo: shade both tails of a Student-t density beyond +/-|t_obs|
# (the two-sided p-value region) and overlay the standard normal density.
t_obs = 1.5            # observed t statistic; edit to demo other cases
n = 200
k = 3
df_demo = n - (k + 1)  # degrees of freedom, n-(k+1); raise it to watch t approach the normal

xs = np.linspace(-4, 4, 800)
t_density = stats.t.pdf(xs, df=df_demo)  # evaluated once, reused for curve and shading

fig, ax = plt.subplots(figsize=(6, 4))

# Density curves
ax.plot(xs, t_density, label=f"t (df={df_demo})")
ax.plot(xs, stats.norm.pdf(xs), label="Normal(0,1)")

# Both tails at least |t_obs| away from zero
mask = np.abs(xs) >= abs(t_obs)
ax.fill_between(xs, 0, t_density, where=mask, alpha=0.3, label="Two-sided p region")

ax.set_title(f"Two-sided p-value shading for t_obs = {t_obs}, df = {df_demo}")
ax.set_xlabel("t")
ax.set_ylabel("density")
ax.legend(loc="upper right", frameon=False)
plt.show()

# --- Simulate the data-generating process ---
n = 200
# Three independent standard-normal regressors, drawn in the order x1, x2, x3.
x1, x2, x3 = (np.random.normal(size=n) for _ in range(3))

# True coefficients; beta1 = 0, so H0: beta1 = 0 holds by construction.
beta0 = 1.0
beta1 = 0.0
beta2 = 0.8
beta3 = -0.5

# Standard-normal error term, then the outcome.
u = np.random.normal(size=n)
y = beta0 + beta1*x1 + beta2*x2 + beta3*x3 + u

# --- Design matrix: the three regressors plus an intercept column ---
X = sm.add_constant(pd.DataFrame({'x1': x1, 'x2': x2, 'x3': x3}))

# --- Fit OLS and report ---
m = sm.OLS(y, X).fit()
print(m.summary())

                            OLS Regression Results                            
==============================================================================
Dep. Variable:                      y   R-squared:                       0.472
Model:                            OLS   Adj. R-squared:                  0.464
Method:                 Least Squares   F-statistic:                     58.40
Date:                Fri, 31 Oct 2025   Prob (F-statistic):           5.10e-27
Time:                        05:13:09   Log-Likelihood:                -288.58
No. Observations:                 200   AIC:                             585.2
Df Residuals:                     196   BIC:                             598.3
Df Model:                           3                                         
Covariance Type:            nonrobust                                         
==============================================================================
                 coef    std err          t      P>|t|      [0.025      0.975]
------------------------------------------------------------------------------
const          0.9139      0.073     12.434      0.000       0.769       1.059
x1            -0.0341      0.072     -0.471      0.638      -0.177       0.109
x2             0.7863      0.072     10.952      0.000       0.645       0.928
x3            -0.6166      0.074     -8.311      0.000      -0.763      -0.470
==============================================================================
Omnibus:                        1.336   Durbin-Watson:                   2.082
Prob(Omnibus):                  0.513   Jarque-Bera (JB):                1.021
Skew:                           0.155   Prob(JB):                        0.600
Kurtosis:                       3.164   Cond. No.                         1.13
==============================================================================

Notes:
[1] Standard Errors assume that the covariance matrix of the errors is correctly specified.

# Joint test H0: coefficient on x2 = 0 and coefficient on x3 = 0  (q = 2 restrictions)

# Fit the unrestricted model UR (const + x1 + x2 + x3) and the restricted
# model R (const + x1), which imposes H0 by dropping x2 and x3.
X_ur = sm.add_constant(pd.DataFrame({'x1': x1, 'x2': x2, 'x3': x3}))
fit_ur = sm.OLS(y, X_ur).fit()
X_r = sm.add_constant(pd.DataFrame({'x1': x1}))
fit_r = sm.OLS(y, X_r).fit()

# Manual F statistic: F = [(SSR_R - SSR_UR) / q] / [SSR_UR / (n - p)]
SSR_UR, SSR_R = fit_ur.ssr, fit_r.ssr
# Number of restrictions = columns dropped when going from UR to R (2 here).
q = X_ur.shape[1] - X_r.shape[1]
# p counts every column of the unrestricted design, intercept included.
n, p = int(fit_ur.nobs), X_ur.shape[1]
df2 = n - p
F_manual = ((SSR_R - SSR_UR)/q) / (SSR_UR/df2)
# Upper-tail probability via the survival function. Writing it as
# `1 - cdf` loses all precision once cdf rounds to 1.0 (it bottoms out near
# 1e-16), which made the manual p-value disagree with statsmodels.
p_manual = stats.f.sf(F_manual, q, df2)
print({'F_manual': float(F_manual), 'p_manual': float(p_manual), 'df1': q, 'df2': df2})

# statsmodels f_test (same null)
print(fit_ur.f_test("x2 = 0, x3 = 0"))

# Optional decision at level alpha. The F test rejects only for large F
# (upper tail), so there is no two-sided version of this rule.
alpha = 0.05
print(f"Decision @ alpha={alpha}:", "REJECT H0" if p_manual < alpha else "Do NOT reject H0")

{'F_manual': 87.56190320272353, 'p_manual': 1.1102230246251565e-16, 'df1': 2, 'df2': 196}
<F test: F=87.56190320272353, p=6.7336608095612395e-28, df_denom=196, df_num=2>
Decision @ alpha=0.05: REJECT H0

ECON320 Week 9 — Inference: t & F Tests (Completed version)¶

📦 Required libraries¶

1) Motivation for t-tests: compare your estimate to a 0-mean normal under H₀¶

🔭 Tiny visual: exact Student‑$t$ (finite sample) with normal overlay (asymptotic)¶

2) Single‑coefficient t test in practice¶

Workflow (two-sided t-test)¶

Code: synthetic data + a single‑coefficient t test¶

Setting for this demo: synthetic data where the null is true for $\,\beta_1\,$¶

4) From t to F: testing multiple coefficients at once¶

Code: Compute F test manually and via `statsmodels` `f_test`¶

References & Acknowledgments¶

ECON320 Week 9 — Inference: t & F Tests (Completed version)¶

📦 Required libraries¶

1) Motivation for t-tests: compare your estimate to a 0-mean normal under H₀¶

🔭 Tiny visual: exact Student‑$t$ (finite sample) with normal overlay (asymptotic)¶

2) Single‑coefficient t test in practice¶

Workflow (two-sided t-test)¶

Code: synthetic data + a single‑coefficient t test¶

Setting for this demo: synthetic data where the null is true for $\,\beta_1\,$¶

4) From t to F: testing multiple coefficients at once¶

Code: Compute F test manually and via statsmodels f_test¶

References & Acknowledgments¶

Code: Compute F test manually and via `statsmodels` `f_test`¶