import numpy as np
import matplotlib.pyplot as plt

from quantrocket.master import get_securities
from quantrocket import get_prices

# Look up MSFT in the usstock listing and take the first index entry as its sid.
msft_listing = get_securities(symbols='MSFT', vendors='usstock')
msft_sid = msft_listing.index[0]

# Date window passed to get_prices below.
start = "2015-01-01"
end = "2016-01-01"

# Request daily Close prices for MSFT over that window.
prices = get_prices(
    "usstock-free-1min",
    data_frequency='daily',
    sids=msft_sid,
    start_date=start,
    end_date=end,
    fields='Close',
)
close_by_sid = prices.loc['Close']
msft_prices = close_by_sid[msft_sid]

# Chart the price series.
ax = msft_prices.plot()
ax.set_ylabel('Price');

# Convert prices to period-over-period percentage changes; the first entry
# has no prior observation to compare against, so it is dropped.
msft_returns = msft_prices.pct_change()[1:]

# Chart the return series.
ax = msft_returns.plot()
ax.set_ylabel('Returns');

# Draw the standard normal density on [-3, 3] and shade both tails beyond
# +/-1.96, the rejection regions named in the plot title.
def norm_pdf(x):
    """Return the standard normal density evaluated at x."""
    return (1/np.sqrt(2 * np.pi)) * np.exp(-x * x / 2)


x = np.linspace(-3, 3, 100)
y = norm_pdf(x)

fig, ax = plt.subplots(nrows=1, ncols=1, sharex=True)
ax.plot(x, y)
# Upper tail first, then lower tail (same drawing order as before).
for tail_mask in (x > 1.96, x < -1.96):
    ax.fill_between(x, 0, y, where=tail_mask)
ax.set_title('Rejection regions for a two-tailed hypothesis test at 95% confidence')
ax.set_xlabel('x')
ax.set_ylabel('p(x)');

# One-sample t statistic for the mean of the MSFT returns against a
# hypothesized mean of 0: (sample mean - 0) / (sample std / sqrt(n)).
n = len(msft_returns)
sample_mean = msft_returns.mean()
standard_error = msft_returns.std() / np.sqrt(n)
test_statistic = (sample_mean - 0) / standard_error
print('t test statistic: ', test_statistic)

t test statistic:  0.8410571845968116

from scipy.stats import t

# Two-sided p-value for the t statistic with n - 1 degrees of freedom.
# The tail probability is taken at |test_statistic| so the result is valid
# for negative statistics as well (1 - cdf of a negative value would yield a
# "p-value" above 1). The survival function t.sf is used instead of
# 1 - t.cdf to avoid floating-point cancellation far out in the tail.
p_val = 2 * t.sf(abs(test_statistic), n - 1)
print('P-value is: ', p_val)

P-value is:  0.40111962686198677

# Look up the SPY and AAPL listings; the index of the result is used as sids.
securities = get_securities(symbols=['SPY', 'AAPL'], vendors='usstock')

start = '2015-01-01'
end = '2016-01-01'

# Daily Close prices for both securities over the window.
price_data = get_prices(
    'usstock-free-1min',
    data_frequency='daily',
    sids=securities.index.tolist(),
    start_date=start,
    end_date=end,
    fields='Close',
)
closes = price_data.loc['Close']

# Relabel the columns from sid to ticker symbol.
sids_to_symbols = securities.Symbol.to_dict()
closes = closes.rename(columns=sids_to_symbols)

# Percentage changes, with the first row (no prior observation) dropped.
aapl_and_spy_returns = closes.pct_change()[1:]
aapl_and_spy_returns.plot()
plt.ylabel('Returns');

# Sample mean, standard deviation and size of each return series.
spy_returns = aapl_and_spy_returns['SPY']
aapl_returns = aapl_and_spy_returns['AAPL']
mu_spy, mu_aapl = spy_returns.mean(), aapl_returns.mean()
s_spy, s_aapl = spy_returns.std(), aapl_returns.std()
n_spy, n_aapl = len(spy_returns), len(aapl_returns)

# Each sample's variance divided by its sample size.
spy_term = s_spy**2 / n_spy
aapl_term = s_aapl**2 / n_aapl

# t statistic for a hypothesized difference in means of 0, without pooling
# the two variances.
test_statistic = ((mu_spy - mu_aapl) - 0) / (spy_term + aapl_term)**0.5

# Modified degrees of freedom for the unequal-variance test.
# NOTE(review): the denominator divides by n; the commonly quoted
# Welch-Satterthwaite form divides by n - 1 -- confirm which is intended.
df = (spy_term + aapl_term)**2 / ((spy_term**2 / n_spy) + (aapl_term**2 / n_aapl))

print('t test statistic: ', test_statistic)
print('Degrees of freedom (modified):', df)

t test statistic:  0.03288029678361224
Degrees of freedom (modified): 401.68304097450897

from scipy.stats import chi2

# Illustrate the chi-square density for several degrees of freedom k.
degrees_shown = (1, 2, 3, 4, 6, 9)
x = np.linspace(0, 8, 100)
y_1, y_2, y_3, y_4, y_6, y_9 = (chi2.pdf(x, k) for k in degrees_shown)

fig, ax = plt.subplots()
# One curve per k, drawn in ascending order of k.
for k, density in zip(degrees_shown, (y_1, y_2, y_3, y_4, y_6, y_9)):
    ax.plot(x, density, label='k = {0}'.format(k))
ax.legend()
ax.set_title('Chi-Square distribution with k degrees of freedom')
ax.set_xlabel('x')
ax.set_ylabel('p(x)');

msft_returns.plot()
plt.ylabel('Returns');

# Chi-square statistic for a single variance:
# (n - 1) * sample variance / hypothesized variance.
hypothesized_variance = 0.0001
degrees_of_freedom = len(msft_returns) - 1
sample_variance = msft_returns.std()**2
test_statistic = degrees_of_freedom * sample_variance / hypothesized_variance
print('Chi-square test statistic:', test_statistic)

Chi-square test statistic: 792.2349828818994

# Compute the critical value directly, because the degrees of freedom are too
# high for most printed chi-square tables.
# The degrees of freedom (sample size - 1) are computed once and interpolated
# into the message, so the reported df always matches the value passed to
# chi2.ppf instead of relying on a hard-coded number.
chi2_df = len(msft_returns) - 1
crit_value = chi2.ppf(0.99, chi2_df)
print('Critical value at a = 0.01 with {0} df:'.format(chi2_df), crit_value)

Critical value at a = 0.01 with 251 df: 304.9395557339572

# Sample standard deviations of the SPY and AAPL return series built earlier.
spy_std_dev, aapl_std_dev = (
    aapl_and_spy_returns[symbol].std() for symbol in ('SPY', 'AAPL')
)
print('SPY standard deviation is:', spy_std_dev)
print('AAPL standard deviation is:', aapl_std_dev)

SPY standard deviation is: 0.00974063235659978
AAPL standard deviation is: 0.01686545757071526

# F statistic: the square of AAPL's standard deviation over SPY's, i.e. the
# ratio of the two sample variances.
std_dev_ratio = aapl_std_dev / spy_std_dev
test_statistic = std_dev_ratio**2
print("F Test statistic:", test_statistic)

F Test statistic: 2.9979332080761387

# Degrees of freedom are the number of observations minus one. Both series
# are columns of the same DataFrame, so the two values are equal.
df1, df2 = (len(aapl_and_spy_returns[symbol]) - 1 for symbol in ('AAPL', 'SPY'))

print('Degrees of freedom for SPY:', df2)
print('Degrees of freedom for AAPL:', df1)

Degrees of freedom for SPY: 250
Degrees of freedom for AAPL: 250

from scipy.stats import f

# Two-tailed F test at a = 0.05: the critical values are the 2.5% and 97.5%
# quantiles of the F distribution with (df1, df2) degrees of freedom.
lower_crit_value = f.ppf(0.025, df1, df2)
upper_crit_value = f.ppf(0.975, df1, df2)

upper_label = 'Upper critical value at a = 0.05 with df1 = {0} and df2 = {1}:'.format(df1, df2)
lower_label = 'Lower critical value at a = 0.05 with df1 = {0} and df2 = {1}:'.format(df1, df2)
print(upper_label, upper_crit_value)
print(lower_label, lower_crit_value)

Upper critical value at a = 0.05 with df1 = 250 and df2 = 250: 1.2820806494835295
Lower critical value at a = 0.05 with df1 = 250 and df2 = 250: 0.7799821332634866

| Decision | True Situation: $H_0$ True | True Situation: $H_0$ False |
|---|---|---|
| Do not reject $H_0$ | Correct Decision | Type II Error |
| Reject $H_0$ (accept $H_A$) | Type I Error | Correct Decision |

Hypothesis Testing

The Null and Alternative Hypothesis

Examples

Difficulty of Testing

Hypotheses Must be Testable

How to Perform Hypothesis Testing

Why is this all necessary?

Critical Value

Hypothesis Testing on Means

Hypothesis Testing on Variances

Comparing Two Variances

Other Resources