import time
import math
import numpy as np
import pandas as pd
import datetime
import scipy as sc
import matplotlib.pyplot as plt
#from pandas_datareader import data as pdr
from IPython.display import display, Latex
from statsmodels.graphics.tsaplots import plot_acf, plot_pacf


import os

from fredapi import Fred

# SECURITY: an API key was committed to source here. The key is now taken from
# the FRED_API_KEY environment variable when it is set; the literal remains
# only as a fallback so existing runs keep working. Rotate this key and delete
# the fallback once the environment variable is configured.
fred_key = os.environ.get('FRED_API_KEY', 'ffc8bae82c04b73a42221721a114855a')
fred = Fred(api_key=fred_key)

# Download the 'SP500' series; every later cell derives its data from this.
stock_price = fred.get_series('SP500')


# Daily log returns r_t = ln(P_t / P_{t-1}).
# Missing observations are removed BEFORE differencing. Dropping them only
# afterwards (as before) makes every gap erase the following day's return as
# well, and feeds NaN into np.log (the likely origin of the
# "invalid value encountered in log" RuntimeWarning).
# NOTE: the name `log_price` is kept because later cells read it, but the
# series holds log returns, not log prices; the plot title says so.
observed_price = stock_price.dropna()
log_price = np.log(observed_price / observed_price.shift(1)).dropna()
log_price.plot()
plt.title('Daily Log Return')
plot_acf(log_price)
plt.show()

/Users/mie/opt/anaconda3/lib/python3.9/site-packages/pandas/core/arraylike.py:358: RuntimeWarning: invalid value encountered in log
  result = getattr(ufunc, method)(*inputs, **kwargs)


# Squared daily log returns, plotted together with their autocorrelation.
return_squared = log_price * log_price
squared_axes = return_squared.plot()
squared_axes.set_title('Squared Daily Return')
plot_acf(return_squared)
plt.show()


# Rolling volatility: standard deviation of the log returns over a window of
# Trading_Days observations, scaled by sqrt(252) (presumably the number of
# trading days per year). Windows that are not yet full yield NaN and are
# dropped.
Trading_Days = 40
rolling_std = log_price.rolling(window=Trading_Days).std()
volatility = (rolling_std * np.sqrt(252)).dropna()
volatility.plot()
# Optional diagnostics: plot_acf(volatility) / plot_pacf(volatility)
plt.show()


# conditional mean of the OU transition
def mu(x, dt, k, theta):
    """Return ``x*exp(-k*dt) + theta*(1 - exp(-k*dt))``.

    Parameters
    ----------
    x : value(s) at the start of the step (scalar or NumPy array).
    dt : length of the time step.
    k : rate appearing in the exponential decay factor.
    theta : level the expression moves towards as ``k*dt`` grows.
    """
    decay = np.exp(-k * dt)  # e^{-k dt}
    pull_to_theta = theta * (1 - decay)
    return x * decay + pull_to_theta

# conditional standard deviation of the OU transition
def std(dt, k, sigma):
    """Return ``sqrt(sigma**2 / (2*k) * (1 - exp(-2*k*dt)))``.

    Parameters
    ----------
    dt : length of the time step.
    k : rate appearing in the exponential decay factor (``k == 0`` divides
        by zero).
    sigma : diffusion coefficient.
    """
    decay_sq = np.exp(-2 * k * dt)  # e^{-2k dt}
    variance = sigma**2 / (2 * k) * (1 - decay_sq)
    return np.sqrt(variance)

# negative log-likelihood of an observed path under the OU transition density
def log_likelihood_OU(theta_hat, x):
    """Return the negative Gaussian log-likelihood of consecutive observations.

    Each observation ``x[i+1]`` is scored against a normal distribution whose
    mean is ``mu(x[i], dt, k, theta)`` and whose standard deviation is
    ``std(dt, k, sigma)``, with ``dt`` fixed at ``1/252``.

    Parameters
    ----------
    theta_hat : sequence ``[k, theta, sigma]``.
    x : one-dimensional array of observations, in time order.

    Returns
    -------
    The negated sum of log densities, suitable for a minimiser.
    """
    k = theta_hat[0]
    theta = theta_hat[1]
    sigma = theta_hat[2]

    x_dt = x[1:]   # observation at the end of each step
    x_t = x[:-1]   # observation at the start of each step

    dt = 1/252

    mu_OU = mu(x_t, dt, k, theta)
    sigma_OU = std(dt, k, sigma)

    # Evaluate the log density directly. Taking np.log of norm.pdf underflows
    # to log(0) = -inf whenever a trial parameter set makes an observation very
    # unlikely, which poisons the objective seen by the optimiser.
    log_likelihood_func = np.sum(
        sc.stats.norm.logpdf(x_dt, loc=mu_OU, scale=sigma_OU)
    )

    return -log_likelihood_func

# constraint: k >= 0
def k_positive(theta_hat):
    """Inequality-constraint function for ``k`` (first entry of ``theta_hat``).

    For an ``'ineq'`` constraint scipy requires the returned value to be
    non-negative. Returning ``abs(k)`` is always non-negative, so it never
    restricted anything; the signed value is what lets the optimiser see that
    a negative ``k`` is infeasible.
    """
    return theta_hat[0]

# constraint: sigma >= 0
def sigma_positive(theta_hat):
    """Inequality-constraint function for ``sigma`` (third entry of ``theta_hat``).

    For an ``'ineq'`` constraint scipy requires the returned value to be
    non-negative. Returning ``abs(sigma)`` is always non-negative, so it never
    restricted anything; the signed value is what lets the optimiser see that
    a negative ``sigma`` is infeasible.
    """
    return theta_hat[2]


# Observed volatility path as a plain NumPy array for the optimiser.
vol = np.array(volatility)

# Inequality constraints, in the dictionary form scipy.optimize.minimize takes.
cons_set = [
    {'type': 'ineq', 'fun': constraint}
    for constraint in (k_positive, sigma_positive)
]

# Starting point for the search, ordered as [k, theta, sigma].
theta0 = [1, 3, 1]

# Minimise the negative log-likelihood to obtain the MLE parameters.
opt = sc.optimize.minimize(
    log_likelihood_OU,
    theta0,
    args=(vol,),
    constraints=cons_set,
)

# Estimates rounded to three decimals, plus the most recent observation.
kappa, theta, sigma = (round(estimate, 3) for estimate in opt.x)
vol0 = vol[-1]

# Raw strings keep the LaTeX backslashes literal. In a normal string literal
# '\t' (as in '\theta') is a TAB character, which corrupted the theta label,
# and '\h', '\k', '\s' are invalid escape sequences that newer Python versions
# warn about.
for_kappa_hat = r'$\hat{\kappa} = ' + str(kappa) + '$'
for_theta_hat = r'$\hat{ \theta } = ' + str(theta) + '$'
for_sigma_hat = r'$\hat{\sigma} = ' + str(sigma) + '$'
print('The MLE for data is:')
display(Latex(for_kappa_hat))
display(Latex(for_theta_hat))
display(Latex(for_sigma_hat))
print('Last Volatility', round(vol0, 3))

The MLE for data is:

/var/folders/90/hk9jz15n56zckxcy3wlt2twh0000gn/T/ipykernel_41709/1550404899.py:25: RuntimeWarning: divide by zero encountered in log
  log_likelihood_func = np.sum( np.log( sc.stats.norm.pdf(x_dt, loc = mu_OU, scale = sigma_OU) ) )
/var/folders/90/hk9jz15n56zckxcy3wlt2twh0000gn/T/ipykernel_41709/1550404899.py:25: RuntimeWarning: invalid value encountered in log
  log_likelihood_func = np.sum( np.log( sc.stats.norm.pdf(x_dt, loc = mu_OU, scale = sigma_OU) ) )
/var/folders/90/hk9jz15n56zckxcy3wlt2twh0000gn/T/ipykernel_41709/2563713482.py:13: RuntimeWarning: invalid value encountered in double_scalars
  return sigma * np.sqrt((1 - e2kt ) / ( 2 * kappa))

Last Volatility 0.289


# Parameters for sampling the distribution at a single horizon
Time = 3     # horizon passed as the time step to mu() and std() below
M = 10000    # number of draws

# M independent standard-normal draws (mean 0, standard deviation 1).
Z = np.random.normal(0.0, 1.0, M)

def mu(x, dt, kappa, theta):
    """Return ``x*exp(-kappa*dt) + theta*(1 - exp(-kappa*dt))``.

    ``x`` is the starting value, ``dt`` the elapsed time, ``kappa`` the rate in
    the exponential decay factor and ``theta`` the level approached as
    ``kappa*dt`` grows.
    """
    decay = np.exp(-kappa * dt)
    weight_on_theta = 1 - decay
    return x * decay + theta * weight_on_theta

def std(dt, kappa, sigma):
    """Return ``sigma * sqrt((1 - exp(-2*kappa*dt)) / (2*kappa))``.

    ``dt`` is the elapsed time, ``kappa`` the rate in the exponential decay
    factor (``kappa == 0`` divides by zero) and ``sigma`` the diffusion
    coefficient.
    """
    decay_sq = np.exp(-2 * kappa * dt)
    scaled_variance = (1 - decay_sq) / (2 * kappa)
    return sigma * np.sqrt(scaled_variance)
                         
# Sample the distribution at horizon `Time`: mean from mu(), spread from std().
drift_OU = mu(vol0, Time, kappa, theta)
# std() takes (dt, kappa, sigma). The third argument must be the fitted
# diffusion coefficient `sigma`; passing `theta` (the long-run level) scaled
# the spread by the wrong parameter.
diffusion_OU = std(Time, kappa, sigma)
vol_OU = drift_OU + diffusion_OU * Z

plt.hist(vol_OU)
# Title spelling corrected ("Ornsterin" -> "Ornstein").
plt.title('Ornstein-Uhlenbeck Continuous Distribution @ Time')
plt.xlabel('Volatility')
plt.show()


# Discretisation grid for the path simulation.
days = 1
years = 2

dt = days/252          # step length: `days` out of 252 per year

M = 1000               # number of simulated paths (columns)
N = int(years/dt)      # number of time steps (rows)

# One row of standard-normal shocks per step, and a path array whose every
# entry starts at the last observed volatility.
Z = np.random.normal(size=(N, M))
vol_OU = np.full((N, M), vol0)

def OU_recursive(t, vol_OU):
    """Fill rows ``t .. N-1`` of ``vol_OU`` with Euler steps and return it.

    Row ``s`` is computed from row ``s-1`` as
    ``vol_OU[s-1] + kappa*(theta - vol_OU[s-1])*dt + sigma*sqrt(dt)*Z[s]``,
    reading ``N``, ``kappa``, ``theta``, ``sigma``, ``dt`` and ``Z`` from module
    scope. ``vol_OU`` is modified in place and also returned.

    The name is kept for callers, but the steps are now taken in a loop: the
    earlier self-recursive form used one Python stack frame per time step and
    raised ``RecursionError`` once ``N`` approached the interpreter's recursion
    limit (about 1000 by default). The values written are unchanged.

    Parameters
    ----------
    t : index of the first row to compute. For ``t == 0`` the "previous" row
        is ``vol_OU[-1]`` (negative index wraps to the last row), so the array
        must be pre-filled with the starting value, as the calling cell does.
    vol_OU : array with one row per time step.
    """
    diffusion_OU = sigma*np.sqrt(dt)  # identical for every step
    for step in range(t, N):
        previous = vol_OU[step - 1]
        drift_OU = kappa*(theta - previous)*dt
        vol_OU[step] = previous + drift_OU + diffusion_OU*Z[step]
    return vol_OU
    
    
# Time the simulation that starts from row 0.
start_time = time.time()
vol_OU = OU_recursive(0, vol_OU)
print('Execution time', time.time() - start_time)

# Put a row holding the starting value on top so every plotted path begins at vol0.
vol_OU = np.vstack((np.full((1, M), vol0), vol_OU))

plt.plot(vol_OU)
plt.ylabel('Volatility')
plt.title('Ornstein-Uhlenbeck Euler Discretization')
plt.show()

Execution time 0.007803916931152344


# Euler discretisation with an explicit loop.
# Row 0 holds the starting value and rows 1..N hold the N simulated steps.
# Previously the loop began at row 1 of an N-row array (so row 0 stayed at
# vol0) and a further vol0 row was prepended afterwards: every path started
# with a duplicated initial point and contained only N-1 steps. Allocating
# N+1 rows up front gives the same final shape, (N+1, M), without that
# off-by-one and without the extra concatenate.
vol_OU = np.full(shape=(N + 1, M), fill_value=vol0)
Z = np.random.normal(size=(N, M))
diffusion_OU = sigma*np.sqrt(dt)  # does not depend on t, so computed once
start_time = time.time()
for t in range(1, N + 1):
    drift_OU = kappa*(theta - vol_OU[t-1])*dt
    # Z has N rows (indices 0..N-1); step t consumes shock row t-1.
    vol_OU[t] = vol_OU[t-1] + drift_OU + diffusion_OU*Z[t-1]
print('Execution time', time.time() - start_time)
plt.plot(vol_OU)
plt.title('Ornstein-Uhlenbeck Euler Discretization')
plt.ylabel('Volatility')
plt.show()

Execution time 0.005856037139892578

Ornstein-Uhlenbeck

So what’s the distribution function of the Ornstein-Uhlenbeck process?

MLE of the Ornstein-Uhlenbeck Process

Simulating the Ornstein-Uhlenbeck Process:

Discrete SDE