We use some of the code from the pymc-devs Python/pymc3 port of the Statistical Rethinking code examples.
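For reference, the candidate model definitions in this exercise were, as best I recall (treat the exact forms as an assumption):

$$(1)\ \mu_i = \alpha + \beta x_i \qquad (2)\ \mu_i = \beta_x x_i + \beta_z z_i$$
$$(3)\ \mu_i = \alpha + \beta(x_i - z_i) \qquad (4)\ \mu_i = \alpha + \beta_x x_i + \beta_z z_i$$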
(2) and (4). (3) is not, because it has only one slope parameter, $\beta$, applied to the single combined predictor $x_i - z_i$. In the case of (2) the value of $\alpha$ is just zero.
Since multiple regression gives you the relationship between a predictor and the outcome once we condition on the other predictors, it serves as a natural way to control for variables. As a result, we can just define a model with latitude and plant diversity as predictors. I'm unsure how to define a prior for $\alpha$ because I'm not sure how animal or plant diversity is measured and what the bounds are. The $\beta$ variables would be normally distributed since in principle there could be a negative correlation; in fact, my limited knowledge of ecology suggests that the closer latitude is to zero, the more plant diversity there would be.
$$A_i \sim \text{Normal}(\mu_i, \sigma)$$
$$\mu_i = \alpha + \beta_L L_i + \beta_P P_i$$
$$\alpha \sim \;?$$
$$\beta_L \sim \text{Normal}(?, ?)$$
$$\beta_P \sim \text{Normal}(?, ?)$$
$$\sigma \sim \text{Exponential}(1)$$

To answer this question, we need three models. Two are linear regressions using just one predictor variable each (funding, or size of laboratory), and the third is a multiple regression that uses both variables as predictors. I'll leave out the priors in the definitions. If the variables are positively associated, then the slope parameters will be positive. A sketch of the three models is below.
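Here's a minimal sketch of those three models in PyMC3. Everything here is hypothetical: funding_std, size_std and awards_std are placeholder standardized arrays, and the priors are my own generic choices.

import numpy as np
import pymc3 as pm

rng = np.random.default_rng(1)
# Placeholder data: funding and lab size are correlated, and both are
# (by construction here) positively associated with research output.
funding_std = rng.normal(size=30)
size_std = 0.7*funding_std + rng.normal(scale=0.5, size=30)
awards_std = 0.5*funding_std + 0.3*size_std + rng.normal(scale=0.5, size=30)

def linear_model(predictors, outcome):
    # Linear regression with any number of standardized predictors.
    with pm.Model() as model:
        alpha = pm.Normal('alpha', 0, 0.2)
        sigma = pm.Exponential('sigma', 1)
        mu = alpha
        for i, x in enumerate(predictors):
            mu = mu + pm.Normal(f'beta_{i}', 0, 0.5) * x
        pm.Normal('output', mu, sigma, observed=outcome)
    return model

m_funding = linear_model([funding_std], awards_std)         # funding only
m_size = linear_model([size_std], awards_std)               # lab size only
m_both = linear_model([funding_std, size_std], awards_std)  # both predictors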
I'm unsure about this. (4) and (5) are definitely equivalent, but I'm not sure about the inferential equivalence of the other models.
This spurious correlation would occur when one of the predictors tells you a lot about the other one. For example, your height might be a predictor of how many points you score per game in basketball. Dollars earned from basketball might also be a predictor of points scored per game. The idea is that once you use dollars earned and height as predictors together, the correlation between the outcome and one of the predictors should vanish. Let's imagine that negative points means conceding points.
import scipy.stats as stats
# Number of examples
N = 50
height = stats.norm.rvs(185, 20, size=N)
height
array([217.70370906, 176.62474253, 135.48839208, 204.33018221, 221.2555992 , 192.73927388, 174.12544474, 186.39726947, 176.37460251, 201.62819558, 175.0154484 , 194.84015413, 189.30342283, 154.63882221, 210.05528764, 158.86074527, 171.47967362, 155.53749026, 213.99510896, 179.42324713, 168.75907485, 168.02791729, 221.87242679, 193.84679686, 171.35573273, 166.42480703, 195.54374488, 164.44516731, 140.24767869, 193.96779659, 164.04046969, 189.8870312 , 195.20294169, 165.55226134, 196.28057687, 203.89512562, 201.50696961, 220.71966871, 165.54022251, 186.40398498, 177.21034541, 203.59587076, 151.13211769, 161.9524153 , 165.19785122, 132.13229663, 185.22403884, 168.4897427 , 202.53181223, 141.45099719])
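# Points depend on height plus noise, and dollars depend on points plus noise,
# so height and dollars are associated only through points.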
points = (height - height.mean())*0.5 + stats.norm.rvs(30, 4, size=N)
points
array([50.98368289, 30.14347858, 18.17825031, 41.86679753, 46.98424037, 32.25986993, 20.5750566 , 27.47423342, 28.40703385, 41.41355882, 34.39020317, 39.13316614, 36.54248156, 25.93125218, 38.40182353, 13.3540376 , 28.6895941 , 10.62231361, 47.40030282, 28.08898817, 27.60646253, 26.04813835, 48.47460193, 38.53430646, 29.91146428, 30.12401774, 39.5892765 , 21.38121706, 11.47651907, 37.60164008, 23.665808 , 40.66219594, 45.2138738 , 23.21787652, 41.4237737 , 36.91235783, 37.64458071, 50.00325272, 26.4958737 , 34.7052263 , 27.96821668, 37.99137941, 15.46501284, 16.92681691, 19.16976979, 1.35238123, 37.6474833 , 24.23198908, 33.98225995, 17.88808647])
dollars = (points - points.mean())*2000 + stats.norm.rvs(150000, 30000, size=N)
dollars
array([251706.91468057, 171783.65971325, 106156.59966768, 183491.65137273, 169012.37074299, 192148.93858638, 97453.00293163, 153819.90165495, 156608.0653772 , 149728.45852434, 144763.8884134 , 206383.79440544, 163765.72884044, 75136.39605974, 187341.05891388, 77759.12194905, 154255.94268634, 50125.56390801, 179451.1305269 , 108481.11197453, 153729.99324746, 85335.12083463, 190052.33208607, 93042.13744746, 123587.6808668 , 133570.6119705 , 176300.69536791, 135149.51393847, 108905.45562505, 173697.32608022, 159114.92528045, 157367.06658104, 188405.86898049, 94843.8795158 , 94666.16959798, 175820.24743537, 147365.72331752, 143556.87772374, 132468.48992668, 151884.11053819, 170479.32934139, 128916.58238489, 112649.33112641, 117827.63623242, 100802.6706479 , 105239.47890317, 154645.20691575, 129758.21943312, 157983.49600463, 167387.79734218])
import pymc3 as pm
height_std = (height - height.mean()) / height.std()
points_std = (points - points.mean()) / points.std()
dollars_std = (dollars - dollars.mean()) / dollars.std()
Now let's define some models and do inference. First, let's predict dollars earned based on points.
with pm.Model() as m1:
sigma = pm.Lognormal('sigma', mu=1, sd=2)
alpha = pm.Normal('alpha', mu=0, sd=1)
beta = pm.Normal('beta', mu=0, sd=1)
    mu = alpha + beta*points_std  # points_std is already centred, so no need to subtract its mean
dollars_preds = pm.Normal('dollars', mu=mu, sd=sigma, observed=dollars_std)
def plot_predictive(prior_check):
_, ax = plt.subplots()
x = np.linspace(-2.5, 2.5, 50)
for a, b in zip(prior_check["alpha"], prior_check["beta"]):
y = a + b * x
ax.plot(x, y, c="k", alpha=0.4)
ax.set_xlabel("Predictor")
ax.set_ylabel("Mean Outcome")
with m1:
prior_check = pm.sample_prior_predictive()
import matplotlib.pyplot as plt
import numpy as np
with m1:
trace = pm.sample(1000, tune=1000)
plot_predictive(trace)
Now let's predict dollars earned based on height.
with pm.Model() as m2:
sigma = pm.Lognormal('sigma', mu=1, sd=2)
alpha = pm.Normal('alpha', mu=0, sd=1)
beta = pm.Normal('beta', mu=0, sd=1)
mu = alpha + beta*(height_std)
dollars_preds = pm.Normal('dollars', mu=mu, sd=sigma, observed=dollars_std)
with m2:
trace = pm.sample(1000, tune=1000)
plot_predictive(trace)
Now let's predict dollars earned based on both height and points.
with pm.Model() as m3:
sigma = pm.Lognormal('sigma', mu=1, sd=2)
alpha = pm.Normal('alpha', mu=0, sd=1)
beta = pm.Normal('beta', mu=0, sd=1)
beta_2 = pm.Normal('beta_2', mu=0, sd=1)
mu = alpha + beta*(height_std) + beta_2*(points_std)
dollars_preds = pm.Normal('dollars', mu=mu, sd=sigma, observed=dollars_std)
with m3:
trace = pm.sample(1000, tune=1000)
plot_predictive(trace)
Adapt the plot to use the second beta coefficient, corresponding to points scored.
def plot_predictive(prior_check):
_, ax = plt.subplots()
x = np.linspace(-2.5, 2.5, 50)
for a, b in zip(prior_check["alpha"], prior_check["beta_2"]):
y = a + b * x
ax.plot(x, y, c="k", alpha=0.4)
ax.set_xlabel("Predictor")
ax.set_ylabel("Mean Outcome")
plot_predictive(trace)
Note how the ranges of plausible posterior regression lines are much wider in the multiple regression, and even admit negative relationships between predictors and outcome, whereas the single-predictor linear regressions were far less equivocal.
As an example of a masked relationship, we will do multiple regression to predict climbing grades. The predictor variables will be finger strength and weight. Finger strength is positively associated with the grade someone can climb. Weight is negatively associated. But finger strength is positively associated with weight.
What we expect is an unclear bivariate relationship between finger strength and climbing grade, but when multiple regression is used, the coefficient for finger strength will become strongly positive.
I found an actual small dataset on this! Sure enough, the statistical experiment bore it out.
weight = np.array([135, 141, 127, 120, 133, 161, 160, 138, 127, 107, 146, 128, 147, 110, 133, 156, 136, 131, 168, 109, 143, 177, 140, 107])
bouldering = np.array([10, 10, 6, 5, 7, 8, 5, 6, 7, 8, 5, 13, 13, 5, 9, 8, 9, 6, 4, 8, 7, 3, 10, 3])
# strength to weight ratio of the left hand
hand_l_ratio = np.array([81.48, 92.2, 62.99, 54.17, 71.43, 71.43, 53.75, 47.1, 70.87, 80.37, 46.58, 100, 102.04, 54.55, 82.71, 72.44, 88.24, 68.7, 57.14, 80.73, 61.05, 77.97, 90.71, 46.73])
assert len(weight) == len(bouldering)
assert len(hand_l_ratio) == len(bouldering)
# Raw strength of left hand
hand_l = (hand_l_ratio / 100)*weight
plt.scatter(weight, bouldering)
plt.scatter(hand_l, bouldering)
plt.scatter(hand_l, weight)
weight_std = (weight - weight.mean()) / weight.std()
hand_l_std = (hand_l - hand_l.mean()) / hand_l.std()
bouldering_std = (bouldering - bouldering.mean()) / bouldering.std()
with pm.Model() as m:
a = pm.Normal('a', 0, 0.2)
bS = pm.Normal('bS', 0, 0.5)
bW = pm.Normal('bW', 0, 0.5)
sigma = pm.Exponential('sigma', 1)
mu = a + bS * hand_l_std + bW * weight_std
grade = pm.Normal('grade', mu, sigma, observed=bouldering_std)
with m:
prior_check = pm.sample_prior_predictive(samples=50)
def plot_predictive(prior_check, a_key='a', b_key='b'):
_, ax = plt.subplots()
x = np.linspace(-2.5, 2.5, 50)
for a, b in zip(prior_check[a_key], prior_check[b_key]):
y = a + b * x
ax.plot(x, y, c="k", alpha=0.4)
ax.set_xlabel("Predictor")
ax.set_ylabel("Mean Outcome")
plot_predictive(prior_check, 'a', 'bW')
import arviz as az
def plot_linear_hdi(a_samples, b_samples, sigma_samples, x_seq):
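    # a_samples, b_samples, sigma_samples: 1-D arrays of parameter draws (prior or posterior).
    # x_seq: grid of standardized predictor values to plot over.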
obs_samples = []
for i in range(len(a_samples)):
mu_sample = a_samples[i] + b_samples[i]*x_seq
sigma_sample = sigma_samples[i]
obs_samples.append(np.random.normal(mu_sample, sigma_sample))
obs_samples = np.array(obs_samples)
# The distribution over observed samples
az.plot_hdi(x_seq, obs_samples, hdi_prob=0.97)
# The MAP estimate of the relationship
plt.plot(x_seq, a_samples.mean() + b_samples.mean()*x_seq, color='black')
mu_pred = np.array([a_samples + b_samples*x for x in x_seq]).T
# The distribution of the mean of mu.
az.plot_hdi(x_seq, mu_pred, hdi_prob=0.97, color='blue')
plot_linear_hdi(prior_check['a'], prior_check['bW'], prior_check['sigma'], np.linspace(-2, 2, num=30))
with m:
trace = pm.sample(1000, tune=1000, return_inferencedata=False)
# There is a negative relationship between weight and bouldering grade when we control for finger strength.
plot_linear_hdi(trace['a'], trace['bW'], trace['sigma'], np.linspace(-2, 2, num=30))
# There is a strong positive correlation between finger strength and bouldering grade
plot_linear_hdi(trace['a'], trace['bS'], trace['sigma'], np.linspace(-2, 2, num=30))
with pm.Model() as m:
a = pm.Normal('a', 0, 0.2)
bS = pm.Normal('bS', 0, 0.5)
bW = pm.Normal('bW', 0, 0.5)
sigma = pm.Exponential('sigma', 1)
mu = a + bW * weight_std
grade = pm.Normal('grade', mu, sigma, observed=bouldering_std)
with m:
trace = pm.sample(1000, tune=1000)
# But when we don't control for finger strength the relationship between weight and bouldering grade is very subtle.
plot_linear_hdi(trace['a'], trace['bW'], trace['sigma'], np.linspace(-2, 2, num=30))
with pm.Model() as m:
a = pm.Normal('a', 0, 0.2)
bS = pm.Normal('bS', 0, 0.5)
bW = pm.Normal('bW', 0, 0.5)
sigma = pm.Exponential('sigma', 1)
mu = a + bS * hand_l_std
grade = pm.Normal('grade', mu, sigma, observed=bouldering_std)
with m:
trace = pm.sample(1000, tune=1000)
plot_linear_hdi(trace['a'], trace['bS'], trace['sigma'], np.linspace(-2, 2, num=30))
A high divorce rate might cause a higher marriage rate because once you divorce you're back in the pool of people who can marry again. People are perhaps not so likely to divorce and then stay single forever; they probably divorce and remarry. In that sense, higher divorce rates might cause marriages.
Predict marriage rate using both divorce rate and age at marriage as predictors. If the divorce-rate coefficient is large, it suggests divorce plays a role in marriage rates even when controlling for age at marriage. A sketch of that model is below.
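In PyMC3 the test would look something like this (a sketch only, not run here; it assumes the standardized columns M_std, A_std and D_std constructed in the cells below, and the names m_marriage, bD and bA are mine):

with pm.Model() as m_marriage:
    a = pm.Normal('a', 0, 0.2)
    bD = pm.Normal('bD', 0, 0.5)  # the divorce-rate coefficient of interest
    bA = pm.Normal('bA', 0, 0.5)
    sigma = pm.Exponential('sigma', 1)
    mu = a + bD*df['D_std'] + bA*df['A_std']
    marriage = pm.Normal('marriage', mu, sigma, observed=df['M_std'])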
import pandas as pd
lds_df = pd.read_csv('data/lds.tsv', sep='\t')
divorce_df = pd.read_csv('data/WaffleDivorce.csv', sep=';').rename(columns={'Location':'State'})
df = divorce_df[['State', 'MedianAgeMarriage', 'Marriage', 'Divorce']].merge(lds_df[['State', 'Percentage of Mormon Residents']], on='State')
df['lds'] = df['Percentage of Mormon Residents'].apply(lambda x: float(x[:-1]))
def standardize(col):
return (col - col.mean()) / col.std()
df['L_std'] = standardize(df['lds'])
df['M_std'] = standardize(df['Marriage'])
df['A_std'] = standardize(df['MedianAgeMarriage'])
df['D_std'] = standardize(df['Divorce'])
with pm.Model() as m:
a = pm.Normal('a', 0, 0.2)
bM = pm.Normal('bM', 0, 1)
bA = pm.Normal('bA', 0, 1)
bL = pm.Normal('bL', 0, 1)
sigma = pm.Exponential('sigma', 1)
mu = a + bM*df['M_std'] + bA*df['A_std'] + bL*df['L_std']
    divorce = pm.Normal('divorce', mu, sigma, observed=df['D_std'])
with m:
prior_check = pm.sample_prior_predictive(samples=50)
plot_predictive(prior_check, 'a', 'bM')
plot_predictive(prior_check, 'a', 'bA')
plot_predictive(prior_check, 'a', 'bL')
with m:
trace = pm.sample(1000, tune=1000)
plot_linear_hdi(trace['a'], trace['bM'], trace['sigma'], np.linspace(-2, 2, num=30))
plot_linear_hdi(trace['a'], trace['bA'], trace['sigma'], np.linspace(-2, 2, num=30))
plot_linear_hdi(trace['a'], trace['bL'], trace['sigma'], np.linspace(-2, 2, num=30))
So we see that marriage rate is not a predictor of divorce rate once you control for median age at marriage and the proportion of LDS residents. The LDS proportion and median age at marriage are quite predictive.
The two mechanisms:
- A higher price of petrol means less driving and more exercise.
- A higher price of petrol means less eating out, and thus less food consumed.
We want to examine the role of each of these mechanisms. Multiple regression could do this by including two other predictor variables: frequency of eating out, and amount of exercise. Ideally the exercise predictor would specifically be the number of hours spent walking or cycling to commute, since you could still drive a lot and exercise a lot. It would also be good to include the amount of driving itself as a predictor: both of the mechanisms above are predicated on the assumption that the price of petrol actually decreases the amount of driving, and if that isn't the case we'd need to generate some other hypotheses. A sketch of such a model follows.
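As a sketch of what that regression might look like (entirely hypothetical: the variables and the simulated associations below are placeholders, not real data):

N_people = 100
petrol_std = np.random.normal(size=N_people)  # standardized price of petrol faced
driving_std = -0.5*petrol_std + np.random.normal(scale=0.5, size=N_people)
eat_out_std = 0.5*driving_std + np.random.normal(scale=0.5, size=N_people)
exercise_std = -0.5*driving_std + np.random.normal(scale=0.5, size=N_people)
obesity_std = 0.5*eat_out_std - 0.5*exercise_std + np.random.normal(scale=0.5, size=N_people)
with pm.Model() as m_petrol:
    a = pm.Normal('a', 0, 0.2)
    bP = pm.Normal('bP', 0, 0.5)   # price of petrol
    bE = pm.Normal('bE', 0, 0.5)   # frequency of eating out
    bX = pm.Normal('bX', 0, 0.5)   # active-commute exercise
    bD = pm.Normal('bD', 0, 0.5)   # amount of driving
    sigma = pm.Exponential('sigma', 1)
    mu = a + bP*petrol_std + bE*eat_out_std + bX*exercise_std + bD*driving_std
    obesity = pm.Normal('obesity', mu, sigma, observed=obesity_std)

If the two mechanisms account for the whole effect, the coefficient on petrol price should shrink toward zero once the mediators are included.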
The implied conditional independency is just $M \perp D \mid A$. To test whether the data are consistent with it, we create a multiple regression model predicting $D$ with $M$ and $A$ as predictors, and we can also create one without $A$ as a predictor. If the conditional independency holds, there will be no relationship between $M$ and $D$ once you control for $A$; otherwise there will be.
with pm.Model() as m:
a = pm.Normal('a', 0, 0.2)
bM = pm.Normal('bM', 0, 1)
bA = pm.Normal('bA', 0, 1)
sigma = pm.Exponential('sigma', 1)
mu = a + bM*df['M_std'] + bA*df['A_std']
    divorce = pm.Normal('divorce', mu, sigma, observed=df['D_std'])
with m:
trace = pm.sample(1000, tune=1000)
plot_linear_hdi(trace['a'], trace['bM'], trace['sigma'], np.linspace(-2, 2, num=30))
So we see a slight negative association between marriage and divorce rates when you control for $A$. They're perhaps not quite conditionally independent, then, but we can still conclude that marriage in and of itself doesn't cause divorce. How about when you don't include $A$ as a predictor?
with pm.Model() as m:
a = pm.Normal('a', 0, 0.2)
bM = pm.Normal('bM', 0, 1)
sigma = pm.Exponential('sigma', 1)
mu = a + bM*df['M_std']
    divorce = pm.Normal('divorce', mu, sigma, observed=df['D_std'])
with m:
trace = pm.sample(1000, tune=1000)
plot_linear_hdi(trace['a'], trace['bM'], trace['sigma'], np.linspace(-2, 2, num=30))
Strictly speaking, we didn't need this second regression to test the conditional independence claim, but if the real question is how $A$ affects the relationship between $M$ and $D$, then comparing the two models tells us that.
Counterfactual plot to see the effect of halving a state's marriage rate. First we do the counterfactual prediction in terms of standardized variables; then we work out what halving the marriage rate means on the standardized scale, which gives us the answer to the problem.
# We want to regress A on M, and then D on A. A theano shared variable for the predictor lets us substitute counterfactual values later without rebuilding the model.
from theano import shared
marriage_shared = shared(df['M_std'].values)
marriage_shared
<TensorType(float64, vector)>
with pm.Model() as m:
sigmaA = pm.Exponential('sigmaA', 1)
bMA = pm.Normal('bMA', 0, 0.5)
aA = pm.Normal('aA', 0, 0.2)
muA = aA + bMA*marriage_shared
age = pm.Normal('age', muA, sigmaA, observed=df['A_std'])
trace = pm.sample()
az.summary(trace)
| | mean | sd | hdi_3% | hdi_97% | mcse_mean | mcse_sd | ess_bulk | ess_tail | r_hat |
|---|---|---|---|---|---|---|---|---|---|
| bMA | -0.691 | 0.103 | -0.877 | -0.494 | 0.001 | 0.001 | 5432.0 | 2847.0 | 1.0 |
| aA | 0.001 | 0.091 | -0.170 | 0.173 | 0.001 | 0.001 | 5591.0 | 3065.0 | 1.0 |
| sigmaA | 0.713 | 0.075 | 0.583 | 0.852 | 0.001 | 0.001 | 5445.0 | 2973.0 | 1.0 |
df.columns
Index(['State', 'MedianAgeMarriage', 'Marriage', 'Divorce', 'Percentage of Mormon Residents', 'lds', 'L_std', 'M_std', 'A_std', 'D_std'], dtype='object')
df['Marriage'].mean()
20.114000000000004
half_mean_marriage = df['Marriage'].mean() / 2
half_mean_marriage_std = (half_mean_marriage - df['Marriage'].mean()) / df['Marriage'].std()
half_mean_marriage_std
-2.648038547766006
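# Start the prediction grid at (approximately) the standardized value of half the mean marriage rate.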
M_seq = np.linspace(-2.6481, 2.75)
marriage_shared.set_value(M_seq)
with m:
age_preds = pm.sample_posterior_predictive(trace)
age_preds['age'].shape
(4000, 50)
az.plot_hdi(M_seq, age_preds["age"])
plt.ylabel('A')
plt.xlabel('M')
age_preds['age'].mean(axis=0)
array([ 1.82258725, 1.74722879, 1.69594008, 1.59595079, 1.53130463, 1.44288663, 1.3788489 , 1.28841831, 1.19600307, 1.16037222, 1.0567193 , 0.99219142, 0.92500769, 0.83476246, 0.7901532 , 0.68934497, 0.61405479, 0.51618051, 0.4541858 , 0.39844071, 0.32462541, 0.22467922, 0.14721737, 0.06654621, 0.02264443, -0.06489612, -0.14521053, -0.2261938 , -0.28482633, -0.36421791, -0.4595846 , -0.53383907, -0.61651814, -0.67276719, -0.75118787, -0.81289754, -0.90523969, -0.97735656, -1.07687552, -1.14962839, -1.23666578, -1.27954765, -1.37911201, -1.43973569, -1.5180104 , -1.61901208, -1.67322697, -1.75171885, -1.8183646 , -1.91819972])
# The first mean will correspond to the counterfactual age if we set the mean marriage rate to half of the current one.
age = age_preds['age'].mean(axis=0)[0]
# What age does that std correspond to?
age * df['MedianAgeMarriage'].std() + df['MedianAgeMarriage'].mean()
28.32062472736527
df['MedianAgeMarriage'].mean()
26.053999999999995
# Now we'll learn how median age at marriage predicts divorce rate, before substituting in the age we would have if the marriage rate were halved.
age_shared = shared(df['A_std'].values)
with pm.Model() as m:
sigmaD = pm.Exponential('sigmaD', 1)
bAD = pm.Normal('bAD', 0, 0.5)
aD = pm.Normal('aD', 0, 0.2)
muD = aD + bAD*age_shared
divorce = pm.Normal('divorce', muD, sigmaD, observed=df['D_std'])
trace = pm.sample()
az.summary(trace)
| | mean | sd | hdi_3% | hdi_97% | mcse_mean | mcse_sd | ess_bulk | ess_tail | r_hat |
|---|---|---|---|---|---|---|---|---|---|
| bAD | -0.566 | 0.118 | -0.800 | -0.365 | 0.002 | 0.001 | 5342.0 | 2987.0 | 1.0 |
| aD | 0.000 | 0.102 | -0.193 | 0.191 | 0.002 | 0.002 | 4472.0 | 2696.0 | 1.0 |
| sigmaD | 0.823 | 0.086 | 0.668 | 0.986 | 0.001 | 0.001 | 4726.0 | 2714.0 | 1.0 |
age_shared.set_value(np.array([age]))
with m:
divorce_preds = pm.sample_posterior_predictive(trace)
divorce_preds['divorce'].shape
(4000, 50)
age_shared
<TensorType(float64, vector)>
divorce_preds['divorce'].mean()
-1.034228285082771
divorce_preds['divorce'].mean() * df['Divorce'].std() + df['Divorce'].mean()
7.80486276079621
^ This is what the divorce rate would be if we halved the marriage rate. Compare this to the mean divorce rate:
df['Divorce'].mean()
9.688
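That's a drop of nearly two divorces per 1000 adults. A quick check of the implied relative reduction, using the counterfactual value computed above:

(df['Divorce'].mean() - 7.80486276079621) / df['Divorce'].mean()  # ≈ 0.19, i.e. about a 19% reduction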
import pandas as pd
import numpy as np
df = pd.read_csv('data/milk.csv', sep=';')
df['K'] = (df['kcal.per.g'] - df['kcal.per.g'].mean()) / df['kcal.per.g'].std()
df['N'] = (df['neocortex.perc'] - df['neocortex.perc'].mean()) / df['neocortex.perc'].std()
df['M'] = (np.log(df['mass']) - np.log(df['mass']).mean()) / np.log(df['mass']).std()
# Drop NaN values
df = df.dropna()
df
| | clade | species | kcal.per.g | perc.fat | perc.protein | perc.lactose | mass | neocortex.perc | K | N | M |
|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | Strepsirrhine | Eulemur fulvus | 0.49 | 16.60 | 15.42 | 67.98 | 1.95 | 55.16 | -0.940041 | -2.080196 | -0.455836 |
| 5 | New World Monkey | Alouatta seniculus | 0.47 | 21.22 | 23.58 | 55.20 | 5.25 | 64.54 | -1.063955 | -0.508641 | 0.127441 |
| 6 | New World Monkey | A palliata | 0.56 | 29.66 | 23.46 | 46.88 | 5.37 | 64.54 | -0.506340 | -0.508641 | 0.140751 |
| 7 | New World Monkey | Cebus apella | 0.89 | 53.41 | 15.80 | 30.79 | 2.51 | 67.64 | 1.538249 | 0.010742 | -0.307158 |
| 9 | New World Monkey | S sciureus | 0.92 | 50.58 | 22.33 | 27.09 | 0.68 | 68.85 | 1.724120 | 0.213470 | -1.076270 |
| 10 | New World Monkey | Cebuella pygmaea | 0.80 | 41.35 | 20.85 | 37.80 | 0.12 | 58.85 | 0.980633 | -1.461962 | -2.097830 |
| 11 | New World Monkey | Callimico goeldii | 0.46 | 3.93 | 25.30 | 70.77 | 0.47 | 61.69 | -1.125913 | -0.986139 | -1.293797 |
| 12 | New World Monkey | Callithrix jacchus | 0.71 | 38.38 | 20.09 | 41.53 | 0.32 | 60.32 | 0.423018 | -1.215673 | -1.520189 |
| 15 | Old World Monkey | Miopithecus talpoin | 0.68 | 40.15 | 18.08 | 41.77 | 1.55 | 69.97 | 0.237147 | 0.401118 | -0.591039 |
| 17 | Old World Monkey | M mulatta | 0.97 | 55.51 | 13.17 | 31.32 | 3.24 | 70.41 | 2.033906 | 0.474837 | -0.156810 |
| 19 | Old World Monkey | Papio spp | 0.84 | 54.31 | 10.97 | 34.72 | 12.30 | 73.40 | 1.228462 | 0.975791 | 0.628840 |
| 21 | Ape | Hylobates lar | 0.62 | 34.51 | 12.57 | 52.92 | 5.37 | 67.53 | -0.134597 | -0.007687 | 0.140751 |
| 23 | Ape | Pongo pygmaeus | 0.54 | 37.78 | 7.37 | 54.85 | 35.48 | 71.26 | -0.630255 | 0.617249 | 1.252735 |
| 24 | Ape | Gorilla gorilla gorilla | 0.49 | 27.18 | 16.29 | 56.53 | 79.43 | 72.60 | -0.940041 | 0.841756 | 1.727359 |
| 26 | Ape | Pan paniscus | 0.48 | 21.18 | 11.68 | 67.14 | 40.74 | 70.24 | -1.001998 | 0.446355 | 1.334150 |
| 27 | Ape | P troglodytes | 0.55 | 36.84 | 9.54 | 53.62 | 33.11 | 76.30 | -0.568297 | 1.461666 | 1.212020 |
| 28 | Ape | Homo sapiens | 0.71 | 50.49 | 9.84 | 39.67 | 54.95 | 75.49 | 0.423018 | 1.325956 | 1.510366 |
import arviz as az
import pymc3 as pm
from theano import shared
mass_shared = shared(df['M'].values)
neocortex_shared = shared(df['N'].values)
with pm.Model() as m:
# M -> N
sigmaN = pm.Exponential('sigmaN', 1)
aN = pm.Normal('aM', 0, 0.2)
bMN = pm.Normal('bMN', 0, 0.5)
muN = aN + bMN*mass_shared
neocortex = pm.Normal('neocortex', muN, sigmaN, observed=df['N'])
# M -> K <- N
sigmaK = pm.Exponential('sigmaK', 1)
aK = pm.Normal('aK', 0, 0.2)
bNK = pm.Normal('bNK', 0, 0.5)
bMK = pm.Normal('bMK', 0, 0.5)
muK = aK + bNK*neocortex_shared + bMK*mass_shared
kcal = pm.Normal('kcal', muK, sigmaK, observed=df['K'])
trace = pm.sample()
az.summary(trace)
| | mean | sd | hdi_3% | hdi_97% | mcse_mean | mcse_sd | ess_bulk | ess_tail | r_hat |
|---|---|---|---|---|---|---|---|---|---|
| aM | -0.013 | 0.131 | -0.263 | 0.223 | 0.002 | 0.002 | 4112.0 | 2552.0 | 1.0 |
| bMN | 0.603 | 0.151 | 0.323 | 0.888 | 0.003 | 0.002 | 3678.0 | 2550.0 | 1.0 |
| aK | 0.057 | 0.148 | -0.231 | 0.327 | 0.002 | 0.002 | 4057.0 | 2895.0 | 1.0 |
| bNK | 0.602 | 0.286 | 0.106 | 1.157 | 0.005 | 0.004 | 3006.0 | 2921.0 | 1.0 |
| bMK | -0.643 | 0.252 | -1.108 | -0.165 | 0.005 | 0.004 | 2510.0 | 2712.0 | 1.0 |
| sigmaN | 0.714 | 0.137 | 0.501 | 0.985 | 0.002 | 0.002 | 3617.0 | 2770.0 | 1.0 |
| sigmaK | 0.871 | 0.180 | 0.571 | 1.212 | 0.003 | 0.002 | 2993.0 | 2382.0 | 1.0 |
mass_linspace = np.linspace(df['mass'].min(), df['mass'].max(), 17)
mass_log_linspace = np.log(mass_linspace)
mass_shared.set_value(mass_log_linspace)
with m:
m_neocortex = pm.sample_posterior_predictive(trace)
import matplotlib.pyplot as plt
_, ax = plt.subplots(1, 2, figsize=(12, 4))
az.plot_hdi(mass_linspace, m_neocortex["kcal"], ax=ax[0])
ax[0].plot(mass_linspace, m_neocortex["kcal"].mean(0))
ax[0].set_title("Total counterfactual effect of M on K")
ax[0].set_xlabel("manipulated M")
ax[0].set_ylabel("counterfactual K")
az.plot_hdi(mass_linspace, m_neocortex["neocortex"], ax=ax[1])
ax[1].plot(mass_linspace, m_neocortex["neocortex"].mean(0))
ax[1].set_title("Total counterfactual effect of M -> N")
ax[1].set_xlabel("manipulated M")
ax[1].set_ylabel("counterfactual N");
# There's a non-linear relationship, but the left plot above shows how changing mass affects the kcal per gram of milk.
# Is this really using the simulated effect on N in the prediction of K, though? We can get an answer by using two separate models.
mass_shared = shared(df['M'].values)
neocortex_shared = shared(df['N'].values)
with pm.Model() as m_MN:
# M -> N
sigmaN = pm.Exponential('sigmaN', 1)
aN = pm.Normal('aM', 0, 0.2)
bMN = pm.Normal('bMN', 0, 0.5)
muN = aN + bMN*mass_shared
neocortex = pm.Normal('neocortex', muN, sigmaN, observed=df['N'])
trace_MN = pm.sample()
with pm.Model() as m_MNK:
# M -> K <- N
sigmaK = pm.Exponential('sigmaK', 1)
aK = pm.Normal('aK', 0, 0.2)
bNK = pm.Normal('bNK', 0, 0.5)
bMK = pm.Normal('bMK', 0, 0.5)
muK = aK + bNK*neocortex_shared + bMK*mass_shared
kcal = pm.Normal('kcal', muK, sigmaK, observed=df['K'])
trace_MNK = pm.sample()
mass_linspace = np.linspace(df['mass'].min(), df['mass'].max(), 17)
mass_log_linspace = np.log(mass_linspace)
mass_shared.set_value(mass_log_linspace)
with m_MN:
ppc_MN = pm.sample_posterior_predictive(trace_MN)
ppc_MN['neocortex'].shape
(4000, 17)
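# Note: taking the mean over the posterior-predictive draws of N discards the
# uncertainty in N; a fuller treatment would push each draw through the second model.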
neocortex_shared.set_value(ppc_MN['neocortex'].mean(axis=0))
with m_MNK:
ppc_MNK = pm.sample_posterior_predictive(trace_MNK)
_, ax = plt.subplots(1, 2, figsize=(12, 4))
az.plot_hdi(mass_linspace, ppc_MNK["kcal"], ax=ax[0])
ax[0].plot(mass_linspace, ppc_MNK["kcal"].mean(0))
ax[0].set_title("Total counterfactual effect of M on K")
ax[0].set_xlabel("manipulated M")
ax[0].set_ylabel("counterfactual K")
az.plot_hdi(mass_linspace, ppc_MN["neocortex"], ax=ax[1])
ax[1].plot(mass_linspace, ppc_MN["neocortex"].mean(0))
ax[1].set_title("Total counterfactual effect of M -> N")
ax[1].set_xlabel("manipulated M")
ax[1].set_ylabel("counterfactual N");
# Yeah, so there's a difference. The pymc-devs code for chapter 5 might be incorrect.
Before we bring in Southernness, let's first acknowledge that once age was controlled for, the relationship between $M$ and $D$ became very mild, possibly non-existent. So it might simply be the case that the DAG is $D \leftarrow A \rightarrow M$, without an edge $M \rightarrow D$. Whether or not we keep that edge, the effect of $S$ on $D$ is probably mediated through age at marriage. The implication is that once we control for age, the relationship between $S$ and $D$ should disappear.
So what we will do next is first regress $D$ on $S$ to see the correlation. Then we will do a multiple regression of $D$ on both $S$ and $A$. If the coefficient for $S$ shrinks away in the latter model, that supports the hypothesis that the only edge out of $S$ points to $A$.
import pandas as pd
divorce_df = pd.read_csv('data/WaffleDivorce.csv', sep=';').rename(columns={'Location':'State'})
df = divorce_df
df['M_std'] = standardize(df['Marriage'])
df['A_std'] = standardize(df['MedianAgeMarriage'])
df['D_std'] = standardize(df['Divorce'])
df.head()
| | State | Loc | Population | MedianAgeMarriage | Marriage | Marriage SE | Divorce | Divorce SE | WaffleHouses | South | Slaves1860 | Population1860 | PropSlaves1860 | M_std | A_std | D_std |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | Alabama | AL | 4.78 | 25.3 | 20.2 | 1.27 | 12.7 | 0.79 | 128 | 1 | 435080 | 964201 | 0.45 | 0.022644 | -0.606290 | 1.654205 |
| 1 | Alaska | AK | 0.71 | 25.2 | 26.0 | 2.93 | 12.5 | 2.05 | 0 | 0 | 0 | 0 | 0.00 | 1.549802 | -0.686699 | 1.544364 |
| 2 | Arizona | AZ | 6.33 | 25.8 | 20.3 | 0.98 | 10.8 | 0.74 | 18 | 0 | 0 | 0 | 0.00 | 0.048974 | -0.204241 | 0.610716 |
| 3 | Arkansas | AR | 2.92 | 24.3 | 26.4 | 1.70 | 13.5 | 1.22 | 41 | 1 | 111115 | 435450 | 0.26 | 1.655123 | -1.410387 | 2.093569 |
| 4 | California | CA | 37.25 | 26.8 | 19.1 | 0.39 | 8.0 | 0.24 | 0 | 0 | 0 | 379994 | 0.00 | -0.266989 | 0.599857 | -0.927058 |
# First, regress D on S: predict divorce rate from Southernness alone
with pm.Model() as m:
sigma = pm.Exponential('sigma', 1)
bS = pm.Normal('bS', 0, 0.5, shape=2)
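    # Indexing bS by the South indicator gives each group (non-South vs South) its own mean.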
mu = bS[df['South']]
divorce = pm.Normal('divorce', mu, sigma, observed=df['D_std'])
with m:
prior_check = pm.sample_prior_predictive()
az.plot_ppc(az.from_pymc3(posterior_predictive=prior_check, model=m));
with m:
trace = pm.sample()
az.plot_trace(trace)
az.summary(trace)
| | mean | sd | hdi_3% | hdi_97% | mcse_mean | mcse_sd | ess_bulk | ess_tail | r_hat |
|---|---|---|---|---|---|---|---|---|---|
| bS[0] | -0.194 | 0.156 | -0.470 | 0.104 | 0.002 | 0.002 | 5073.0 | 2654.0 | 1.0 |
| bS[1] | 0.428 | 0.228 | 0.018 | 0.864 | 0.003 | 0.002 | 4891.0 | 2867.0 | 1.0 |
| sigma | 0.961 | 0.099 | 0.791 | 1.150 | 0.001 | 0.001 | 4775.0 | 2682.0 | 1.0 |
So there's clearly a difference between the groups: Southernness is strongly associated with divorce rates. Now let's see what happens when we control for age at marriage.
with pm.Model() as m:
sigma = pm.Exponential('sigma', 1)
bA = pm.Normal('bA', 0, 0.5, shape=2)
a = pm.Normal('a', 0, 0.2, shape=2)
mu = a[df['South']] + bA[df['South']]*df['A_std']
divorce = pm.Normal('divorce', mu, sigma, observed=df['D_std'])
with m:
prior_check = pm.sample_prior_predictive()
plot_linear_hdi(prior_check['a'][:, 0], prior_check['bA'][:, 0], prior_check['sigma'], np.linspace(-2, 2, num=30))
plot_linear_hdi(prior_check['a'][:, 1], prior_check['bA'][:, 1], prior_check['sigma'], np.linspace(-2, 2, num=30))
with m:
trace = pm.sample()
az.summary(trace)
| | mean | sd | hdi_3% | hdi_97% | mcse_mean | mcse_sd | ess_bulk | ess_tail | r_hat |
|---|---|---|---|---|---|---|---|---|---|
| bA[0] | -0.456 | 0.117 | -0.661 | -0.217 | 0.002 | 0.001 | 5250.0 | 3263.0 | 1.0 |
| bA[1] | -0.911 | 0.296 | -1.452 | -0.347 | 0.005 | 0.003 | 4315.0 | 3570.0 | 1.0 |
| a[0] | -0.102 | 0.111 | -0.302 | 0.121 | 0.002 | 0.001 | 5121.0 | 3140.0 | 1.0 |
| a[1] | 0.089 | 0.155 | -0.197 | 0.373 | 0.002 | 0.002 | 4232.0 | 3403.0 | 1.0 |
| sigma | 0.781 | 0.083 | 0.647 | 0.949 | 0.001 | 0.001 | 4606.0 | 2848.0 | 1.0 |
az.plot_trace(trace)
plot_linear_hdi(trace['a'][:, 1], trace['bA'][:, 1], trace['sigma'], np.linspace(-2, 2, num=30))
plot_linear_hdi(trace['a'][:, 0], trace['bA'][:, 0], trace['sigma'], np.linspace(-2, 2, num=30))
This seems to be a case where an indicator variable is actually more useful than an index variable, because it directly tells us how much Southernness changes the mean.
with pm.Model() as m:
sigma = pm.Exponential('sigma', 1)
bS = pm.Normal('bS', 0, 0.5)
a = pm.Normal('a', 0, 0.2)
mu = a + bS*df['South']
divorce = pm.Normal('divorce', mu, sigma, observed=df['D_std'])
with m:
prior_check = pm.sample_prior_predictive()
plot_linear_hdi(prior_check['a'], prior_check['bS'], prior_check['sigma'], np.linspace(-2, 2, num=30))
with m:
trace = pm.sample()
az.summary(trace)
| | mean | sd | hdi_3% | hdi_97% | mcse_mean | mcse_sd | ess_bulk | ess_tail | r_hat |
|---|---|---|---|---|---|---|---|---|---|
| bS | 0.509 | 0.254 | 0.025 | 0.980 | 0.005 | 0.003 | 2922.0 | 2530.0 | 1.0 |
| a | -0.095 | 0.126 | -0.328 | 0.142 | 0.002 | 0.002 | 3203.0 | 2465.0 | 1.0 |
| sigma | 0.967 | 0.102 | 0.788 | 1.157 | 0.002 | 0.001 | 4184.0 | 2653.0 | 1.0 |
az.plot_trace(trace)
plot_linear_hdi(trace['a'], trace['bS'], trace['sigma'], np.linspace(-2, 2, num=30))
So southernness is clearly associated with higher divorce rates: southern states sit about half a standard deviation higher on average (bS ≈ 0.51). Now let's control for age at marriage.
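Reading the priors off the code below, the model is (with $D_i$ the standardized divorce rate, $S_i$ the southernness indicator, and $A_i$ the standardized median age at marriage):

$$ D_i \sim \text{Normal}(\mu_i, \sigma)$$
$$ \mu_i = \alpha + \beta_S S_i + \beta_A A_i$$
$$ \alpha \sim \text{Normal}(0, 0.2)$$
$$ \beta_S \sim \text{Normal}(0, 0.5)$$
$$ \beta_A \sim \text{Normal}(0, 0.5)$$
$$ \sigma \sim \text{Exponential}(1)$$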
with pm.Model() as m:
    sigma = pm.Exponential('sigma', 1)
    bS = pm.Normal('bS', 0, 0.5)
    bA = pm.Normal('bA', 0, 0.5)
    a = pm.Normal('a', 0, 0.2)
    mu = a + bS*df['South'] + bA*df['A_std']
    divorce = pm.Normal('divorce', mu, sigma, observed=df['D_std'])
with m:
    prior_check = pm.sample_prior_predictive()
plot_linear_hdi(prior_check['a'], prior_check['bA'], prior_check['sigma'], np.linspace(-2, 2, num=30))
with m:
    trace = pm.sample()
Auto-assigning NUTS sampler...
Initializing NUTS using jitter+adapt_diag...
Multiprocess sampling (4 chains in 4 jobs)
NUTS: [a, bA, bS, sigma]
Sampling 4 chains for 1_000 tune and 1_000 draw iterations (4_000 + 4_000 draws total) took 14 seconds.
az.summary(trace)
|  | mean | sd | hdi_3% | hdi_97% | mcse_mean | mcse_sd | ess_bulk | ess_tail | r_hat |
|---|---|---|---|---|---|---|---|---|---|
| bS | 0.348 | 0.224 | -0.068 | 0.776 | 0.004 | 0.003 | 2644.0 | 2874.0 | 1.0 |
| bA | -0.528 | 0.114 | -0.734 | -0.311 | 0.002 | 0.001 | 3974.0 | 2630.0 | 1.0 |
| a | -0.076 | 0.110 | -0.282 | 0.132 | 0.002 | 0.002 | 3055.0 | 2978.0 | 1.0 |
| sigma | 0.804 | 0.085 | 0.663 | 0.973 | 0.001 | 0.001 | 4491.0 | 2756.0 | 1.0 |
az.plot_trace(trace)
[Trace plots and posterior densities for bS, bA, a, and sigma]
plot_linear_hdi(trace['a'], trace['bS'], trace['sigma'], np.linspace(-2, 2, num=30))
Southernness is still quite associated with divorce rates even when controlling for age at marriage, though the association weakens: bS drops from about 0.51 to 0.35, and its 94% HDI now just crosses zero. So there's something else at play! We'll do one more regression, where we also control for marriage rate, just to be sure.
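With the standardized marriage rate $M_i$ added, the only change to the model is the linear term:

$$ \mu_i = \alpha + \beta_S S_i + \beta_A A_i + \beta_M M_i$$

with $\beta_M \sim \text{Normal}(0, 0.5)$ like the other slopes.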
with pm.Model() as m:
    sigma = pm.Exponential('sigma', 1)
    bS = pm.Normal('bS', 0, 0.5)
    bA = pm.Normal('bA', 0, 0.5)
    bM = pm.Normal('bM', 0, 0.5)
    a = pm.Normal('a', 0, 0.2)
    mu = a + bS*df['South'] + bA*df['A_std'] + bM*df['M_std']
    divorce = pm.Normal('divorce', mu, sigma, observed=df['D_std'])
with m:
    trace = pm.sample()
Auto-assigning NUTS sampler...
Initializing NUTS using jitter+adapt_diag...
Multiprocess sampling (4 chains in 4 jobs)
NUTS: [a, bM, bA, bS, sigma]
Sampling 4 chains for 1_000 tune and 1_000 draw iterations (4_000 + 4_000 draws total) took 14 seconds.
az.plot_trace(trace)
[Trace plots and posterior densities for bS, bA, bM, a, and sigma]
az.summary(trace)
|  | mean | sd | hdi_3% | hdi_97% | mcse_mean | mcse_sd | ess_bulk | ess_tail | r_hat |
|---|---|---|---|---|---|---|---|---|---|
| bS | 0.339 | 0.227 | -0.085 | 0.761 | 0.004 | 0.003 | 3003.0 | 3130.0 | 1.0 |
| bA | -0.557 | 0.160 | -0.881 | -0.273 | 0.003 | 0.002 | 2570.0 | 2331.0 | 1.0 |
| bM | -0.036 | 0.159 | -0.330 | 0.258 | 0.003 | 0.002 | 2544.0 | 2696.0 | 1.0 |
| a | -0.074 | 0.109 | -0.280 | 0.125 | 0.002 | 0.001 | 3237.0 | 3082.0 | 1.0 |
| sigma | 0.813 | 0.085 | 0.664 | 0.973 | 0.001 | 0.001 | 3444.0 | 3130.0 | 1.0 |
plot_linear_hdi(trace['a'], trace['bS'], trace['sigma'], np.linspace(-2, 2, num=30))
Yeah, it looks like southernness is associated with divorce rates through some path that doesn't run through age at marriage or marriage rate: adding marriage rate leaves bS essentially unchanged, and bM itself is close to zero.
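The three fits above all overwrite trace, so for a side-by-side comparison of the South coefficient you'd want to keep each posterior under its own name. A minimal sketch, assuming the traces were saved as trace_s, trace_sa, and trace_sam (hypothetical names, not variables defined above), overlaying the bS posteriors with arviz:

# Hypothetical names: trace_s, trace_sa and trace_sam are assumed to hold the
# posteriors from the South-only, South + Age, and South + Age + Marriage
# models respectively, rather than each fit overwriting `trace`.
az.plot_forest(
    [trace_s, trace_sa, trace_sam],
    model_names=['South', 'South + Age', 'South + Age + Marriage'],
    var_names=['bS'],
    combined=True,  # pool the four chains into a single interval per model
)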