ベイズ線形回帰

Contents

ベイズ線形回帰#

import matplotlib.pyplot as plt
import numpy as np
import scipy as sp

# データを作成
n = 1000

from scipy.stats import multivariate_normal
mean = np.array([3, 5])
Sigma = np.array([
    [1, 0.5],
    [0.5, 2],
])
X = multivariate_normal.rvs(mean=mean, cov=Sigma, size=n, random_state=0)

import statsmodels.api as sm
X = sm.add_constant(X)

# 真のパラメータ
beta = np.array([2, 3, 4])

データが均一分散の場合#

# 均一分散の場合
e = np.random.normal(loc=0, scale=1, size=n)
y = X @ beta + e

# 頻度主義
import statsmodels.api as sm
ols = sm.OLS(y, X).fit(cov_type="HC1")
ols.summary()

OLS Regression Results
Dep. Variable:	y	R-squared:	0.981
Model:	OLS	Adj. R-squared:	0.981
Method:	Least Squares	F-statistic:	2.747e+04
Date:	Tue, 02 Dec 2025	Prob (F-statistic):	0.00
Time:	14:36:20	Log-Likelihood:	-1398.4
No. Observations:	1000	AIC:	2803.
Df Residuals:	997	BIC:	2817.
Df Model:	2
Covariance Type:	HC1

	coef	std err	z	P>\|z\|	[0.025	0.975]
const	2.1570	0.126	17.136	0.000	1.910	2.404
x1	2.9851	0.031	95.584	0.000	2.924	3.046
x2	3.9792	0.024	165.219	0.000	3.932	4.026

Omnibus:	0.039	Durbin-Watson:	1.973
Prob(Omnibus):	0.981	Jarque-Bera (JB):	0.029
Skew:	-0.013	Prob(JB):	0.986
Kurtosis:	2.998	Cond. No.	25.9

Notes:
[1] Standard Errors are heteroscedasticity robust (HC1)

import pymc as pm
import arviz as az

model = pm.Model()
with model:
    beta0 = pm.Normal("beta0", mu=0, sigma=1)
    beta1 = pm.Normal("beta1", mu=0, sigma=1)
    beta2 = pm.Normal("beta2", mu=0, sigma=1)
    sigma = pm.HalfNormal("sigma", sigma=1)  # 分散なので非負の分布を使う

    # 平均値 mu
    mu = beta0 + beta1 * X[:, 1] + beta2 * X[:, 2]
    # 観測値をもつ確率変数は_obsとする
    y_obs = pm.Normal("y_obs", mu=mu, sigma=sigma, observed=y)

# モデルをGraphvizで表示
pm.model_to_graphviz(model)

../../_images/fb03ceaf312c1fca30b9c68df7e8c60286079296582d7f46adc0b8a18900d045.svg

# ベイズ線形回帰モデルをサンプリング
with model:
    idata = pm.sample(
        chains=2,
        tune=1000, # バーンイン期間の、捨てるサンプル数
        draws=2000, # 採用するサンプル数
        random_seed=0,
    )

# 各chainsの結果を表示
az.plot_trace(idata, figsize=[4, 4])
plt.tight_layout()
plt.show()

Initializing NUTS using jitter+adapt_diag...

Multiprocess sampling (2 chains in 2 jobs)

NUTS: [beta0, beta1, beta2, sigma]

Sampling 2 chains for 1_000 tune and 2_000 draw iterations (2_000 + 4_000 draws total) took 4 seconds.

We recommend running at least 4 chains for robust computation of convergence diagnostics

../../_images/a2975c37e511853f69c23059a0c92c48ca43c425f3eb5490500e025b7f16c0ec.png

az.plot_posterior(idata)
plt.show()

../../_images/498e5326c0b6316409f14d909c2fcfd57d4939c55f92eec13b983ce15ec03942.png

データが不均一分散の場合#

# 不均一分散の場合
def normalize(x):
    return (x - x.min()) / (x.max() - x.min())

sigma = 1 + normalize(X[:, 1] + X[:, 2]) * 3
e = np.random.normal(loc=0, scale=sigma, size=n)
y = X @ beta + e

頻度主義 & 不均一分散に頑健な誤差推定#

# 頻度主義
import statsmodels.api as sm
ols = sm.OLS(y, X).fit(cov_type="HC1")
ols.summary()

OLS Regression Results
Dep. Variable:	y	R-squared:	0.888
Model:	OLS	Adj. R-squared:	0.888
Method:	Least Squares	F-statistic:	3737.
Date:	Tue, 02 Dec 2025	Prob (F-statistic):	0.00
Time:	14:36:46	Log-Likelihood:	-2314.7
No. Observations:	1000	AIC:	4635.
Df Residuals:	997	BIC:	4650.
Df Model:	2
Covariance Type:	HC1

	coef	std err	z	P>\|z\|	[0.025	0.975]
const	2.7222	0.308	8.846	0.000	2.119	3.325
x1	2.7798	0.084	32.904	0.000	2.614	2.945
x2	3.9813	0.061	65.716	0.000	3.863	4.100

Omnibus:	24.021	Durbin-Watson:	1.941
Prob(Omnibus):	0.000	Jarque-Bera (JB):	45.431
Skew:	0.124	Prob(JB):	1.36e-10
Kurtosis:	4.014	Cond. No.	25.9

Notes:
[1] Standard Errors are heteroscedasticity robust (HC1)

↑ 切片の推定にバイアスが入っている

均一分散を想定したベイズ線形回帰#

import pymc as pm
import arviz as az

model = pm.Model()
with model:
    beta0 = pm.Normal("beta0", mu=0, sigma=1)
    beta1 = pm.Normal("beta1", mu=0, sigma=1)
    beta2 = pm.Normal("beta2", mu=0, sigma=1)
    sigma = pm.HalfNormal("sigma", sigma=1)  # 分散なので非負の分布を使う

    # 平均値 mu
    mu = beta0 + beta1 * X[:, 1] + beta2 * X[:, 2]
    # 観測値をもつ確率変数は_obsとする
    y_obs = pm.Normal("y_obs", mu=mu, sigma=sigma, observed=y)

# モデルをGraphvizで表示
pm.model_to_graphviz(model)

../../_images/fb03ceaf312c1fca30b9c68df7e8c60286079296582d7f46adc0b8a18900d045.svg

# ベイズ線形回帰モデルをサンプリング
with model:
    idata = pm.sample(
        chains=2,
        tune=1000, # バーンイン期間の、捨てるサンプル数
        draws=2000, # 採用するサンプル数
        random_seed=0,
    )

# 各chainsの結果を表示
az.plot_trace(idata, figsize=[4, 4])
plt.tight_layout()
plt.show()

Initializing NUTS using jitter+adapt_diag...

Multiprocess sampling (2 chains in 2 jobs)

NUTS: [beta0, beta1, beta2, sigma]

Sampling 2 chains for 1_000 tune and 2_000 draw iterations (2_000 + 4_000 draws total) took 4 seconds.

We recommend running at least 4 chains for robust computation of convergence diagnostics

../../_images/0a64716831fea39b0d159bd881ac1804fb5297e264668d26fbb367446c43ff95.png

az.plot_posterior(idata)
plt.show()

../../_images/7585e8fe0a2f87c47550cd1d1f6ef2b3d923312926f5388c8f1d44316091a561.png

不均一分散を想定したベイズ線形回帰（WIP）#

分散をxの関数にしたかった。以下コードで推定できるが個々の\(\sigma_i\)が別々に推定される形になって結果が見づらい。もっといい表し方はないものか。

import pymc as pm
import arviz as az

model = pm.Model()
with model:
    beta0 = pm.Normal("beta0", mu=0, sigma=1)
    beta1 = pm.Normal("beta1", mu=0, sigma=1)
    beta2 = pm.Normal("beta2", mu=0, sigma=1)

    # 誤差分散にも線形モデルを入れる
    w0 = pm.Normal("w0", mu=0, sigma=1)
    w1 = pm.Normal("w1", mu=0, sigma=1)
    w2 = pm.Normal("w2", mu=0, sigma=1)
    lam = pm.math.exp(w0 + w1 * X[:, 1] + w2 * X[:, 2])
    sigma = pm.Exponential("sigma", lam=lam)  # 分散なので非負の分布を使う

    # 平均値 mu
    mu = beta0 + beta1 * X[:, 1] + beta2 * X[:, 2]
    # 観測値をもつ確率変数は_obsとする
    y_obs = pm.Normal("y_obs", mu=mu, sigma=sigma, observed=y)

# モデルをGraphvizで表示
pm.model_to_graphviz(model)

# ベイズ線形回帰モデルをサンプリング
with model:
    idata = pm.sample(
        chains=2,
        tune=1000, # バーンイン期間の、捨てるサンプル数
        draws=2000, # 採用するサンプル数
        random_seed=0,
    )

# 各chainsの結果を表示
az.plot_trace(idata, figsize=[4, 4])
plt.tight_layout()
plt.show()

az.plot_posterior(idata)
plt.show()