Let's take a look at the phenomenon of spurious regression; a detailed treatment can be found in Harris, R., & Sollis, R. (2003) [Applied Time Series Modelling and Forecasting. Wiley.]. Data trends can create the illusion of a correlation between variables in a regression equation when, in reality, only correlated time trends exist. To address this, the time trend in a trend-stationary variable can be eliminated in one of two ways: 1) regress the variable on time and use the residuals as a new, trend-free stationary variable; or 2) include a deterministic time trend as a regressor in the model. Either way, the standard regression model then works with stationary series that have constant means and finite variances, so statistical inference based on $t$- and $F$-tests remains valid.
This remedy works only for trend-stationary series. When a variable is non-stationary because of a stochastic trend (a unit root), regressing it on a deterministic trend does not produce a stationary variable; the series must be differenced before analysis. Applying standard regression methods to such non-stationary data leads to the problem of spurious regressions and, in turn, to invalid inferences based on $t$- and $F$-tests. For example, consider the following DGP (data generating process):
\begin{equation*} \begin{array}{ll} x_{1t}=x_{1,t-1}+u_t & u_t \sim \operatorname{IN}(0,1) \\ x_{2t}=x_{2,t-1}+v_t & v_t \sim \operatorname{IN}(0,1) \end{array} \end{equation*}Here $x_{1t}$ and $x_{2t}$ are independent random walks: non-stationary and, by construction, uncorrelated with each other. Suppose we nevertheless estimate the regression model
\begin{equation*} x_{1t}=\alpha_{1}+\alpha_{2}x_{2t}+\varepsilon_t. \end{equation*}Since the true $\alpha_2$ is zero, we would expect the null hypothesis $H_0:\alpha_{2}=0$ not to be rejected and the coefficient of determination ($R^2$) to be close to zero. However, because both regressand and regressor are non-stationary, the error term ($\varepsilon_t$) is also non-stationary, and the usual $t$- and $F$-based inference breaks down.
How can we detect this phenomenon? Suppose we generate 500 observations of $u_t \sim N(0, 1)$ and $v_t \sim N(0, 1)$, assume that the initial values of both $x_1$ and $x_2$ are zero, and assume that $u_t$ and $v_t$ are serially uncorrelated as well as mutually uncorrelated. As you know by now, both resulting time series are nonstationary; that is, they are I(1) or exhibit stochastic trends.
# The Phenomenon of Spurious Regression
import numpy as np
import pandas as pd
import statsmodels.formula.api as smf
import matplotlib.pyplot as plt
import scipy.stats as stats
# fix the random seed (I chose 753951):
np.random.seed(753951)
# I set T=500 and generate errors (ut and vt) from IIDN(0,1)
T=500
u=stats.norm.rvs(0,1,T)
u[0]=0
v=stats.norm.rvs(0,1,T)
v[0]=0
A random walk model is a type of time series model that, by substituting back $n$ periods, can be represented mathematically as:
\begin{equation*} x_{1t}=x_{1,t-n}+\sum_{j=0}^{n-1} u_{t-j}, \end{equation*}where substituting all the way back to the initial value (i.e., $n=t$) gives
\begin{equation*} x_{1t}=x_{1,0}+\sum_{j=0}^{t-1} u_{t-j}. \end{equation*}# Finally, I generate the actual nonstationary series by cumulating the errors
x1=np.cumsum(u)
x2=np.cumsum(v)
hypotheticalData=pd.DataFrame({'x1':x1,'x2':x2})
Let's look at the time series of both series:
plt.plot(x1,color='black',marker='',linestyle='solid', label='x1')
plt.plot(x2,color='red',marker='',linestyle='dotted', label='x2')
plt.ylabel('x1,x2')
plt.legend()
plt.savefig('//.../images/nonsense regression')
# get regression results with OLS
reg=smf.ols(formula='x1 ~ x2 ',data=hypotheticalData)
results=reg.fit()
print(results.summary())
                            OLS Regression Results
==============================================================================
Dep. Variable:                     x1   R-squared:                       0.202
Model:                            OLS   Adj. R-squared:                  0.201
Method:                 Least Squares   F-statistic:                     126.4
Date:                Sat, 28 Jan 2023   Prob (F-statistic):           2.77e-26
Time:                        20:26:44   Log-Likelihood:                -1943.8
No. Observations:                 500   AIC:                             3892.
Df Residuals:                     498   BIC:                             3900.
Df Model:                           1
Covariance Type:            nonrobust
==============================================================================
                 coef    std err          t      P>|t|      [0.025      0.975]
------------------------------------------------------------------------------
Intercept      0.4471      1.742      0.257      0.798      -2.976       3.870
x2             0.8312      0.074     11.241      0.000       0.686       0.976
==============================================================================
Omnibus:                     1954.485   Durbin-Watson:                   0.012
Prob(Omnibus):                  0.000   Jarque-Bera (JB):               46.378
Skew:                           0.310   Prob(JB):                     8.49e-11
Kurtosis:                       1.642   Cond. No.                         77.7
==============================================================================

Notes:
[1] Standard Errors assume that the covariance matrix of the errors is correctly specified.
The coefficient of $x_2$ is highly statistically significant ($t = 11.24$) even though the two series were generated independently of each other. This is the phenomenon of spurious or nonsense regression, first identified by Yule, who demonstrated that correlation can persist in non-stationary time series even when the sample size is large. The extremely low Durbin-Watson $d$ value (0.012) indicates strong first-order autocorrelation in the residuals, signaling a problem with the regression. Granger and Newbold propose $R^2 > d$ as a rule of thumb for flagging a spurious regression, and that is clearly the case here ($0.202 > 0.012$). It's important to note that the $R^2$ and $t$ statistics in such a regression are unreliable and cannot be used for testing hypotheses about the parameters.
G. U. Yule, “Why Do We Sometimes Get Nonsense Correlations Between Time Series? A Study in Sampling and the Nature of Time Series,” Journal of the Royal Statistical Society, vol. 89, 1926.
C. W. J. Granger and P. Newbold, “Spurious Regressions in Econometrics,” Journal of Econometrics, vol. 2, 1974, pp. 111–120.