import arviz as az
import numpy as np
import pandas as pd
import pymc as pm

from matplotlib import pyplot as plt


RANDOM_SEED = 8929
rng = np.random.default_rng(RANDOM_SEED)
az.style.use("arviz-darkgrid")


def simulate_ar(intercept, coef1, coef2, noise=0.3, *, warmup=10, steps=200):
    # We sample some extra warmup steps, to let the AR process stabilize
    draws = np.zeros(warmup + steps)
    # Initialize first draws at intercept
    draws[:2] = intercept
    for step in range(2, warmup + steps):
        draws[step] = (
            intercept
            + coef1 * draws[step - 1]
            + coef2 * draws[step - 2]
            + np.random.normal(0, noise)
        )
    # Discard the warmup draws
    return draws[warmup:]


# True parameters of the AR process
ar1_data = simulate_ar(10, -0.9, 0)

fig, ax = plt.subplots(figsize=(10, 3))
ax.set_title("Generated Autoregressive Timeseries", fontsize=15)
ax.plot(ar1_data);


## Set up a dictionary for the specification of our priors
## We set up the dictionary to specify size of the AR coefficients in
## case we want to vary the AR lags.
priors = {
    "coefs": {"mu": [10, 0.2], "sigma": [0.1, 0.1], "size": 2},
    "sigma": 8,
    "init": {"mu": 9, "sigma": 0.1, "size": 1},
}

## Initialise the model
with pm.Model() as AR:
    pass

## Define the time interval for fitting the data
t_data = list(range(len(ar1_data)))
## Add the time interval as a mutable coordinate to the model to allow for future predictions
AR.add_coord("obs_id", t_data, mutable=True)

with AR:
    ## Data containers to enable prediction
    t = pm.MutableData("t", t_data, dims="obs_id")
    y = pm.MutableData("y", ar1_data, dims="obs_id")

    # The first coefficient will be the constant term but we need to set priors for each coefficient in the AR process
    coefs = pm.Normal("coefs", priors["coefs"]["mu"], priors["coefs"]["sigma"])
    sigma = pm.HalfNormal("sigma", priors["sigma"])
    # We need one init variable for each lag, hence size is variable too
    init = pm.Normal.dist(
        priors["init"]["mu"], priors["init"]["sigma"], size=priors["init"]["size"]
    )
    # Steps of the AR model minus the lags required
    ar1 = pm.AR(
        "ar",
        coefs,
        sigma=sigma,
        init_dist=init,
        constant=True,
        steps=t.shape[0] - (priors["coefs"]["size"] - 1),
        dims="obs_id",
    )

    # The Likelihood
    outcome = pm.Normal("likelihood", mu=ar1, sigma=sigma, observed=y, dims="obs_id")
    ## Sampling
    idata_ar = pm.sample_prior_predictive()
    idata_ar.extend(pm.sample(2000, random_seed=100, target_accept=0.95))
    idata_ar.extend(pm.sample_posterior_predictive(idata_ar))

Sampling: [ar, coefs, likelihood, sigma]
Auto-assigning NUTS sampler...
Initializing NUTS using jitter+adapt_diag...
Multiprocess sampling (4 chains in 4 jobs)
NUTS: [coefs, sigma, ar]

Sampling 4 chains for 1_000 tune and 2_000 draw iterations (4_000 + 8_000 draws total) took 46 seconds.
Sampling: [likelihood]


idata_ar

<xarray.Dataset>
Dimensions:      (chain: 4, draw: 2000, coefs_dim_0: 2, obs_id: 200)
Coordinates:
  * chain        (chain) int64 0 1 2 3
  * draw         (draw) int64 0 1 2 3 4 5 6 ... 1994 1995 1996 1997 1998 1999
  * coefs_dim_0  (coefs_dim_0) int64 0 1
  * obs_id       (obs_id) int64 0 1 2 3 4 5 6 7 ... 193 194 195 196 197 198 199
Data variables:
    coefs        (chain, draw, coefs_dim_0) float64 9.784 -0.8044 ... -0.7937
    ar           (chain, draw, obs_id) float64 8.744 5.527 4.382 ... 5.203 5.425
    sigma        (chain, draw) float64 0.4881 0.5189 0.4896 ... 0.4919 0.536
Attributes:
    created_at:                 2022-11-09T13:37:35.440374
    arviz_version:              0.12.1
    inference_library:          pymc
    inference_library_version:  4.2.2
    sampling_time:              46.495951890945435
    tuning_steps:               1000

array([0, 1, 2, 3])

array([   0,    1,    2, ..., 1997, 1998, 1999])

array([0, 1])

array([  0,   1,   2,   3,   4,   5,   6,   7,   8,   9,  10,  11,  12,  13,
        14,  15,  16,  17,  18,  19,  20,  21,  22,  23,  24,  25,  26,  27,
        28,  29,  30,  31,  32,  33,  34,  35,  36,  37,  38,  39,  40,  41,
        42,  43,  44,  45,  46,  47,  48,  49,  50,  51,  52,  53,  54,  55,
        56,  57,  58,  59,  60,  61,  62,  63,  64,  65,  66,  67,  68,  69,
        70,  71,  72,  73,  74,  75,  76,  77,  78,  79,  80,  81,  82,  83,
        84,  85,  86,  87,  88,  89,  90,  91,  92,  93,  94,  95,  96,  97,
        98,  99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111,
       112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125,
       126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139,
       140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153,
       154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167,
       168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181,
       182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195,
       196, 197, 198, 199])

array([[[ 9.78424718, -0.80438722],
        [ 9.74703572, -0.83706764],
        [ 9.79944405, -0.79930181],
        ...,
        [ 9.53893097, -0.79144711],
        [ 9.59709183, -0.78652045],
        [ 9.73692629, -0.81651835]],

       [[ 9.74268028, -0.80803045],
        [ 9.79526179, -0.81136089],
        [ 9.7890239 , -0.82699725],
        ...,
        [ 9.86478399, -0.81825659],
        [ 9.56231758, -0.7842574 ],
        [ 9.91745608, -0.85332664]],

       [[ 9.86287461, -0.80656223],
        [ 9.7503848 , -0.78838031],
        [ 9.73456476, -0.82507864],
        ...,
        [ 9.67317157, -0.79964398],
        [ 9.72808985, -0.81919129],
        [ 9.79594168, -0.8316699 ]],

       [[ 9.66388511, -0.77070848],
        [ 9.81792066, -0.86152692],
        [ 9.76193626, -0.80400692],
        ...,
        [ 9.82540452, -0.82762375],
        [ 9.68635269, -0.81628275],
        [ 9.72849693, -0.79365451]]])

array([[[8.74352758, 5.52741943, 4.38191711, ..., 5.14480198,
         5.24617995, 5.41743901],
        [8.77550506, 4.90547857, 4.15303127, ..., 4.60138867,
         5.93864166, 4.59592892],
        [8.71329607, 5.52044291, 4.52511514, ..., 5.06972045,
         5.27857848, 5.00547222],
        ...,
        [8.88502664, 5.57377862, 3.89409635, ..., 5.59909617,
         5.32225401, 5.20482076],
        [8.55664857, 4.88659312, 4.38079346, ..., 4.83263795,
         5.33348824, 5.05874786],
        [8.76757844, 4.90809102, 4.54824247, ..., 5.25881292,
         6.12158758, 5.20176982]],

       [[8.86872656, 5.0022022 , 4.58149104, ..., 5.78242943,
         5.27274199, 5.02613374],
        [8.60545624, 5.36327142, 3.87549526, ..., 4.78169205,
         5.73215524, 4.94515273],
        [8.72934777, 5.23184664, 4.26631068, ..., 5.43608436,
         5.69109134, 4.9359198 ],
...
        [8.51872267, 5.67053018, 3.68091342, ..., 5.38074753,
         5.28068957, 4.81562403],
        [8.84368012, 5.00970368, 4.76789871, ..., 5.08216918,
         5.81855931, 5.10367318],
        [8.5910571 , 4.86528321, 4.36407615, ..., 5.52091691,
         5.53541407, 4.56811379]],

       [[8.8404785 , 5.25125451, 3.84738158, ..., 5.62313306,
         4.79819979, 5.02215709],
        [8.58596763, 5.2463655 , 4.40220118, ..., 4.7902282 ,
         5.66964292, 4.48441869],
        [8.60738243, 5.61050158, 4.28259516, ..., 5.1362292 ,
         5.91231786, 5.18238246],
        ...,
        [8.60479962, 5.23713291, 4.55945121, ..., 5.27873283,
         4.82834783, 6.02702215],
        [8.86453311, 5.38558531, 4.04103726, ..., 4.84883412,
         5.98583658, 4.13783256],
        [8.62106165, 5.49281595, 3.85385124, ..., 5.77014132,
         5.20270335, 5.42464754]]])

array([[0.48813477, 0.51890268, 0.48960848, ..., 0.51885326, 0.46876196,
        0.48209071],
       [0.52594341, 0.5199723 , 0.51310773, ..., 0.51786577, 0.51361691,
        0.54464582],
       [0.53240365, 0.51134871, 0.48844114, ..., 0.47774974, 0.4976345 ,
        0.51907641],
       [0.57185232, 0.50741003, 0.52455992, ..., 0.49067704, 0.49186708,
        0.53600122]])

<xarray.Dataset>
Dimensions:     (chain: 4, draw: 2000, obs_id: 200)
Coordinates:
  * chain       (chain) int64 0 1 2 3
  * draw        (draw) int64 0 1 2 3 4 5 6 ... 1994 1995 1996 1997 1998 1999
  * obs_id      (obs_id) int64 0 1 2 3 4 5 6 7 ... 193 194 195 196 197 198 199
Data variables:
    likelihood  (chain, draw, obs_id) float64 8.641 5.752 4.043 ... 5.464 5.011
Attributes:
    created_at:                 2022-11-09T13:37:51.112643
    arviz_version:              0.12.1
    inference_library:          pymc
    inference_library_version:  4.2.2

array([0, 1, 2, 3])


az.plot_trace(idata_ar, figsize=(10, 6), kind="rank_vlines");


az.summary(idata_ar, var_names=["~ar"])


fig, ax = plt.subplots(figsize=(10, 4))
idata_ar.posterior.ar.mean(["chain", "draw"]).plot(ax=ax, label="Posterior Mean AR level")
ax.plot(ar1_data, "o", color="black", markersize=2, label="Observed Data")
ax.legend()
ax.set_title("Fitted AR process\nand observed data");


prediction_length = 250
n = prediction_length - ar1_data.shape[0]
obs = list(range(prediction_length))
with AR:
    ## We need to have coords for the observations minus the lagged term to correctly centre the prediction step
    AR.add_coords({"obs_id_fut_1": range(ar1_data.shape[0] - 1, 250, 1)})
    AR.add_coords({"obs_id_fut": range(ar1_data.shape[0], 250, 1)})
    # condition on the learned values of the AR process
    # initialise the future AR process precisely at the last observed value in the AR process
    # using the special feature of the dirac delta distribution to be 0 everywhere else.
    ar1_fut = pm.AR(
        "ar1_fut",
        init_dist=pm.DiracDelta.dist(ar1[..., -1]),
        rho=coefs,
        sigma=sigma,
        constant=True,
        dims="obs_id_fut_1",
    )
    yhat_fut = pm.Normal("yhat_fut", mu=ar1_fut[1:], sigma=sigma, dims="obs_id_fut")
    # use the updated values and predict outcomes and probabilities:
    idata_preds = pm.sample_posterior_predictive(
        idata_ar, var_names=["likelihood", "yhat_fut"], predictions=True, random_seed=100
    )

Sampling: [ar1_fut, likelihood, yhat_fut]


pm.model_to_graphviz(AR)


idata_preds

<xarray.Dataset>
Dimensions:     (chain: 4, draw: 2000, obs_id: 200, obs_id_fut: 50)
Coordinates:
  * chain       (chain) int64 0 1 2 3
  * draw        (draw) int64 0 1 2 3 4 5 6 ... 1994 1995 1996 1997 1998 1999
  * obs_id      (obs_id) int64 0 1 2 3 4 5 6 7 ... 193 194 195 196 197 198 199
  * obs_id_fut  (obs_id_fut) int64 200 201 202 203 204 ... 245 246 247 248 249
Data variables:
    likelihood  (chain, draw, obs_id) float64 8.599 6.006 3.882 ... 5.206 5.22
    yhat_fut    (chain, draw, obs_id_fut) float64 6.495 5.331 ... 3.495 6.905
Attributes:
    created_at:                 2022-11-09T13:38:50.219240
    arviz_version:              0.12.1
    inference_library:          pymc
    inference_library_version:  4.2.2

array([0, 1, 2, 3])

array([   0,    1,    2, ..., 1997, 1998, 1999])

array([  0,   1,   2,   3,   4,   5,   6,   7,   8,   9,  10,  11,  12,  13,
        14,  15,  16,  17,  18,  19,  20,  21,  22,  23,  24,  25,  26,  27,
        28,  29,  30,  31,  32,  33,  34,  35,  36,  37,  38,  39,  40,  41,
        42,  43,  44,  45,  46,  47,  48,  49,  50,  51,  52,  53,  54,  55,
        56,  57,  58,  59,  60,  61,  62,  63,  64,  65,  66,  67,  68,  69,
        70,  71,  72,  73,  74,  75,  76,  77,  78,  79,  80,  81,  82,  83,
        84,  85,  86,  87,  88,  89,  90,  91,  92,  93,  94,  95,  96,  97,
        98,  99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111,
       112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125,
       126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139,
       140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153,
       154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167,
       168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181,
       182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195,
       196, 197, 198, 199])

array([200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213,
       214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227,
       228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241,
       242, 243, 244, 245, 246, 247, 248, 249])

array([[[8.59884897, 6.00604341, 3.88206887, ..., 4.98169029,
         5.40359092, 5.68191078],
        [8.79670654, 5.93529041, 4.40429365, ..., 5.01546634,
         4.43474002, 3.60012164],
        [8.56847869, 5.39800394, 3.88356292, ..., 4.63002488,
         5.01572423, 4.43078707],
        ...,
        [9.20136104, 4.57883509, 4.48042098, ..., 5.31498913,
         4.44754853, 4.55047726],
        [9.00546596, 5.50518055, 6.01138556, ..., 4.70408191,
         5.11675198, 5.62857239],
        [8.88946697, 5.24419495, 4.00156719, ..., 4.20165221,
         5.82695311, 5.21254244]],

       [[9.58466508, 4.26734586, 4.27939642, ..., 5.14275023,
         5.82883516, 5.43938218],
        [9.6388725 , 5.1134545 , 4.08002374, ..., 4.39881783,
         5.77437617, 5.18038996],
        [8.10630832, 5.11994266, 4.43082836, ..., 4.67106398,
         5.45678235, 4.86631852],
...
        [8.15595583, 5.20394562, 2.951609  , ..., 5.3213695 ,
         6.18673762, 4.1615559 ],
        [8.80889118, 4.55812225, 5.01817234, ..., 5.01598758,
         4.9526523 , 5.56593906],
        [8.61649003, 5.09371976, 4.18762361, ..., 5.47849819,
         5.13814072, 5.95369104]],

       [[9.16858942, 5.12279053, 3.36495293, ..., 6.11475246,
         4.69878594, 4.39136645],
        [8.4054303 , 4.92610756, 4.21464288, ..., 4.26666647,
         5.84868038, 4.81156007],
        [8.67098501, 5.30548722, 4.40671805, ..., 5.16418269,
         5.67730921, 5.38076556],
        ...,
        [8.274733  , 4.58119292, 5.12602147, ..., 5.09634608,
         4.50401847, 5.5991206 ],
        [8.64207991, 5.23009314, 3.9992984 , ..., 4.43087845,
         6.05891835, 4.42354604],
        [8.16730802, 5.70020461, 4.63431287, ..., 5.95958104,
         5.20641388, 5.21960772]]])

array([[[6.4953486 , 5.33147583, 6.98718248, ..., 6.36780178,
         5.19327288, 5.55648387],
        [6.35693501, 4.72419911, 6.34624456, ..., 6.34945251,
         2.44257016, 6.26709538],
        [6.41316592, 4.07332944, 6.75438993, ..., 3.94588935,
         5.45166734, 5.85294635],
        ...,
        [5.53022118, 3.81466774, 5.38812548, ..., 4.30277357,
         5.58011075, 4.3171974 ],
        [5.94471308, 3.53128884, 5.05963497, ..., 4.53589301,
         4.88987214, 5.09390923],
        [4.3616181 , 4.95844304, 5.64978963, ..., 5.81761355,
         5.16029723, 4.70581458]],

       [[4.78506671, 4.28035922, 4.18195535, ..., 6.33435425,
         5.15477639, 5.63097243],
        [5.6816181 , 5.56311808, 4.40708914, ..., 5.73869459,
         5.34695395, 4.84345455],
        [5.84512397, 5.51856095, 6.70363985, ..., 5.61478793,
         5.61052781, 4.7551204 ],
...
        [5.65597631, 4.89324145, 4.57705603, ..., 4.83832309,
         6.64658325, 3.62682651],
        [5.82433233, 4.10600282, 6.54642625, ..., 4.26288255,
         5.16459549, 5.82842815],
        [5.46029854, 5.90144111, 6.09288155, ..., 6.81420745,
         5.6433365 , 5.80063532]],

       [[5.46329009, 4.32768119, 7.01060984, ..., 7.33606912,
         4.79217401, 6.80963022],
        [5.64209241, 3.92499247, 6.18934625, ..., 5.4748427 ,
         4.45647414, 5.62512031],
        [4.40948812, 4.93112986, 6.26481676, ..., 5.87055775,
         3.87404467, 5.58124849],
        ...,
        [6.3038289 , 5.12722683, 5.24307923, ..., 4.31622093,
         5.74889202, 5.40140064],
        [6.05972035, 4.98366893, 5.07665905, ..., 6.3783536 ,
         4.17927265, 5.84074104],
        [6.19750378, 5.32128673, 5.88932402, ..., 5.47006247,
         3.49463187, 6.90531056]]])

<xarray.Dataset>
Dimensions:  (obs_id: 200)
Coordinates:
  * obs_id   (obs_id) int64 0 1 2 3 4 5 6 7 ... 192 193 194 195 196 197 198 199
Data variables:
    t        (obs_id) int32 0 1 2 3 4 5 6 7 ... 192 193 194 195 196 197 198 199
    y        (obs_id) float64 3.367 6.823 3.497 7.269 ... 5.155 5.519 4.693
Attributes:
    created_at:                 2022-11-09T13:38:50.221893
    arviz_version:              0.12.1
    inference_library:          pymc
    inference_library_version:  4.2.2

array([  0,   1,   2,   3,   4,   5,   6,   7,   8,   9,  10,  11,  12,  13,
        14,  15,  16,  17,  18,  19,  20,  21,  22,  23,  24,  25,  26,  27,
        28,  29,  30,  31,  32,  33,  34,  35,  36,  37,  38,  39,  40,  41,
        42,  43,  44,  45,  46,  47,  48,  49,  50,  51,  52,  53,  54,  55,
        56,  57,  58,  59,  60,  61,  62,  63,  64,  65,  66,  67,  68,  69,
        70,  71,  72,  73,  74,  75,  76,  77,  78,  79,  80,  81,  82,  83,
        84,  85,  86,  87,  88,  89,  90,  91,  92,  93,  94,  95,  96,  97,
        98,  99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111,
       112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125,
       126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139,
       140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153,
       154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167,
       168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181,
       182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195,
       196, 197, 198, 199])

array([  0,   1,   2,   3,   4,   5,   6,   7,   8,   9,  10,  11,  12,
        13,  14,  15,  16,  17,  18,  19,  20,  21,  22,  23,  24,  25,
        26,  27,  28,  29,  30,  31,  32,  33,  34,  35,  36,  37,  38,
        39,  40,  41,  42,  43,  44,  45,  46,  47,  48,  49,  50,  51,
        52,  53,  54,  55,  56,  57,  58,  59,  60,  61,  62,  63,  64,
        65,  66,  67,  68,  69,  70,  71,  72,  73,  74,  75,  76,  77,
        78,  79,  80,  81,  82,  83,  84,  85,  86,  87,  88,  89,  90,
        91,  92,  93,  94,  95,  96,  97,  98,  99, 100, 101, 102, 103,
       104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116,
       117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129,
       130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142,
       143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155,
       156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168,
       169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181,
       182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194,
       195, 196, 197, 198, 199], dtype=int32)


def plot_fits(idata_ar, idata_preds):
    palette = "plasma"
    cmap = plt.get_cmap(palette)
    percs = np.linspace(51, 99, 100)
    colors = (percs - np.min(percs)) / (np.max(percs) - np.min(percs))
    mosaic = """AABB
                CCCC"""
    fig, axs = plt.subplot_mosaic(mosaic, sharex=False, figsize=(20, 10))
    axs = [axs[k] for k in axs.keys()]
    for i, p in enumerate(percs[::-1]):
        upper = np.percentile(
            az.extract_dataset(idata_ar, group="prior_predictive", num_samples=1000)["likelihood"],
            p,
            axis=1,
        )
        lower = np.percentile(
            az.extract_dataset(idata_ar, group="prior_predictive", num_samples=1000)["likelihood"],
            100 - p,
            axis=1,
        )
        color_val = colors[i]
        axs[0].fill_between(
            x=idata_ar["constant_data"]["t"],
            y1=upper.flatten(),
            y2=lower.flatten(),
            color=cmap(color_val),
            alpha=0.1,
        )

    axs[0].plot(
        az.extract_dataset(idata_ar, group="prior_predictive", num_samples=1000)["likelihood"].mean(
            axis=1
        ),
        color="cyan",
        label="Prior Predicted Mean Realisation",
    )

    axs[0].scatter(
        x=idata_ar["constant_data"]["t"],
        y=idata_ar["constant_data"]["y"],
        color="k",
        label="Observed Data points",
    )
    axs[0].set_title("Prior Predictive Fit", fontsize=20)
    axs[0].legend()

    for i, p in enumerate(percs[::-1]):
        upper = np.percentile(
            az.extract_dataset(idata_preds, group="predictions", num_samples=1000)["likelihood"],
            p,
            axis=1,
        )
        lower = np.percentile(
            az.extract_dataset(idata_preds, group="predictions", num_samples=1000)["likelihood"],
            100 - p,
            axis=1,
        )
        color_val = colors[i]
        axs[2].fill_between(
            x=idata_preds["predictions_constant_data"]["t"],
            y1=upper.flatten(),
            y2=lower.flatten(),
            color=cmap(color_val),
            alpha=0.1,
        )

        upper = np.percentile(
            az.extract_dataset(idata_preds, group="predictions", num_samples=1000)["yhat_fut"],
            p,
            axis=1,
        )
        lower = np.percentile(
            az.extract_dataset(idata_preds, group="predictions", num_samples=1000)["yhat_fut"],
            100 - p,
            axis=1,
        )
        color_val = colors[i]
        axs[2].fill_between(
            x=idata_preds["predictions"].coords["obs_id_fut"].data,
            y1=upper.flatten(),
            y2=lower.flatten(),
            color=cmap(color_val),
            alpha=0.1,
        )

    axs[2].plot(
        az.extract_dataset(idata_preds, group="predictions", num_samples=1000)["likelihood"].mean(
            axis=1
        ),
        color="cyan",
    )
    idata_preds.predictions.yhat_fut.mean(["chain", "draw"]).plot(
        ax=axs[2], color="cyan", label="Predicted Mean Realisation"
    )
    axs[2].scatter(
        x=idata_ar["constant_data"]["t"],
        y=idata_ar["constant_data"]["y"],
        color="k",
        label="Observed Data",
    )
    axs[2].set_title("Posterior Predictions Plotted", fontsize=20)
    axs[2].axvline(np.max(idata_ar["constant_data"]["t"]), color="black")
    axs[2].legend()
    axs[2].set_xlabel("Time in Days")
    axs[0].set_xlabel("Time in Days")
    az.plot_ppc(idata_ar, ax=axs[1])


plot_fits(idata_ar, idata_preds)


y_t = -0.3 + np.arange(200) * -0.2 + np.random.normal(0, 10, 200)
y_t = y_t + ar1_data

fig, ax = plt.subplots(figsize=(10, 4))
ax.plot(y_t)
ax.set_title("AR Process + Trend data");


def make_latent_AR_model(ar_data, priors, prediction_steps=250, full_sample=True, samples=2000):
    with pm.Model() as AR:
        pass

    t_data = list(range(len(ar_data)))
    AR.add_coord("obs_id", t_data, mutable=True)

    with AR:
        ## Data containers to enable prediction
        t = pm.MutableData("t", t_data, dims="obs_id")
        y = pm.MutableData("y", ar_data, dims="obs_id")
        # The first coefficient will be the intercept term
        coefs = pm.Normal("coefs", priors["coefs"]["mu"], priors["coefs"]["sigma"])
        sigma = pm.HalfNormal("sigma", priors["sigma"])
        # We need one init variable for each lag, hence size is variable too
        init = pm.Normal.dist(
            priors["init"]["mu"], priors["init"]["sigma"], size=priors["init"]["size"]
        )
        # Steps of the AR model minus the lags required given specification
        ar1 = pm.AR(
            "ar",
            coefs,
            sigma=sigma,
            init_dist=init,
            constant=True,
            steps=t.shape[0] - (priors["coefs"]["size"] - 1),
            dims="obs_id",
        )

        # The Likelihood
        outcome = pm.Normal("likelihood", mu=ar1, sigma=sigma, observed=y, dims="obs_id")
        ## Sampling
        idata_ar = pm.sample_prior_predictive()
        if full_sample:
            idata_ar.extend(pm.sample(samples, random_seed=100, target_accept=0.95))
            idata_ar.extend(pm.sample_posterior_predictive(idata_ar))
        else:
            return idata_ar

    n = prediction_steps - ar_data.shape[0]

    with AR:
        AR.add_coords({"obs_id_fut_1": range(ar1_data.shape[0] - 1, 250, 1)})
        AR.add_coords({"obs_id_fut": range(ar1_data.shape[0], 250, 1)})
        # condition on the learned values of the AR process
        # initialise the future AR process precisely at the last observed value in the AR process
        # using the special feature of the dirac delta distribution to be 0 probability everywhere else.
        ar1_fut = pm.AR(
            "ar1_fut",
            init_dist=pm.DiracDelta.dist(ar1[..., -1]),
            rho=coefs,
            sigma=sigma,
            constant=True,
            dims="obs_id_fut_1",
        )
        yhat_fut = pm.Normal("yhat_fut", mu=ar1_fut[1:], sigma=sigma, dims="obs_id_fut")
        # use the updated values and predict outcomes and probabilities:
        idata_preds = pm.sample_posterior_predictive(
            idata_ar, var_names=["likelihood", "yhat_fut"], predictions=True, random_seed=100
        )

    return idata_ar, idata_preds, AR


priors_0 = {
    "coefs": {"mu": [-4, 0.2], "sigma": 0.1, "size": 2},
    "sigma": 8,
    "init": {"mu": 9, "sigma": 0.1, "size": 1},
}

priors_1 = {
    "coefs": {"mu": [-2, 0.2], "sigma": 0.1, "size": 2},
    "sigma": 12,
    "init": {"mu": 8, "sigma": 0.1, "size": 1},
}

priors_2 = {
    "coefs": {"mu": [0, 0.2], "sigma": 0.1, "size": 2},
    "sigma": 15,
    "init": {"mu": 8, "sigma": 0.1, "size": 1},
}

models = {}
for i, p in enumerate([priors_0, priors_1, priors_2]):
    models[i] = {}
    idata = make_latent_AR_model(y_t, p, full_sample=False)
    models[i]["idata"] = idata

Sampling: [ar, coefs, likelihood, sigma]
Sampling: [ar, coefs, likelihood, sigma]
Sampling: [ar, coefs, likelihood, sigma]


fig, axs = plt.subplots(1, 3, figsize=(10, 4), sharey=True)
axs = axs.flatten()
for i, p in zip(range(3), [priors_0, priors_1, priors_2]):
    axs[i].plot(
        az.extract_dataset(models[i]["idata"], group="prior_predictive", num_samples=100)[
            "likelihood"
        ],
        color="blue",
        alpha=0.1,
    )
    axs[i].plot(y_t, "o", color="black", markersize=2)
    axs[i].set_title(
        "$y_{t+1}$" + f'= N({p["coefs"]["mu"][0]} + {p["coefs"]["mu"][1]}y$_t$, {p["sigma"]})'
    )
plt.suptitle("Prior Predictive Specifications", fontsize=20);


priors_0 = {
    "coefs": {"mu": [-4, 0.2], "sigma": [0.5, 0.03], "size": 2},
    "sigma": 8,
    "init": {"mu": -4, "sigma": 0.1, "size": 1},
}

idata_no_trend, preds_no_trend, model = make_latent_AR_model(y_t, priors_0)

Sampling: [ar, coefs, likelihood, sigma]
Auto-assigning NUTS sampler...
Initializing NUTS using jitter+adapt_diag...
Multiprocess sampling (4 chains in 4 jobs)
NUTS: [coefs, sigma, ar]

Sampling 4 chains for 1_000 tune and 2_000 draw iterations (4_000 + 8_000 draws total) took 49 seconds.
Sampling: [likelihood]

Sampling: [ar1_fut, likelihood, yhat_fut]


plot_fits(idata_no_trend, preds_no_trend)


def make_latent_AR_trend_model(
    ar_data, priors, prediction_steps=250, full_sample=True, samples=2000
):
    with pm.Model() as AR:
        pass

    t_data = list(range(len(ar_data)))
    AR.add_coord("obs_id", t_data, mutable=True)

    with AR:
        ## Data containers to enable prediction
        t = pm.MutableData("t", t_data, dims="obs_id")
        y = pm.MutableData("y", ar_data, dims="obs_id")
        # The first coefficient will be the intercept term
        coefs = pm.Normal("coefs", priors["coefs"]["mu"], priors["coefs"]["sigma"])
        sigma = pm.HalfNormal("sigma", priors["sigma"])
        # We need one init variable for each lag, hence size is variable too
        init = pm.Normal.dist(
            priors["init"]["mu"], priors["init"]["sigma"], size=priors["init"]["size"]
        )
        # Steps of the AR model minus the lags required given specification
        ar1 = pm.AR(
            "ar",
            coefs,
            sigma=sigma,
            init_dist=init,
            constant=True,
            steps=t.shape[0] - (priors["coefs"]["size"] - 1),
            dims="obs_id",
        )

        ## Priors for the linear trend component
        alpha = pm.Normal("alpha", priors["alpha"]["mu"], priors["alpha"]["sigma"])
        beta = pm.Normal("beta", priors["beta"]["mu"], priors["beta"]["sigma"])
        trend = pm.Deterministic("trend", alpha + beta * t, dims="obs_id")

        mu = ar1 + trend

        # The Likelihood
        outcome = pm.Normal("likelihood", mu=mu, sigma=sigma, observed=y, dims="obs_id")
        ## Sampling
        idata_ar = pm.sample_prior_predictive()
        if full_sample:
            idata_ar.extend(pm.sample(samples, random_seed=100, target_accept=0.95))
            idata_ar.extend(pm.sample_posterior_predictive(idata_ar))
        else:
            return idata_ar

    n = prediction_steps - ar_data.shape[0]

    with AR:
        AR.add_coords({"obs_id_fut_1": range(ar1_data.shape[0] - 1, prediction_steps, 1)})
        AR.add_coords({"obs_id_fut": range(ar1_data.shape[0], prediction_steps, 1)})
        t_fut = pm.MutableData("t_fut", list(range(ar1_data.shape[0], prediction_steps, 1)))
        # condition on the learned values of the AR process
        # initialise the future AR process precisely at the last observed value in the AR process
        # using the special feature of the dirac delta distribution to be 0 probability everywhere else.
        ar1_fut = pm.AR(
            "ar1_fut",
            init_dist=pm.DiracDelta.dist(ar1[..., -1]),
            rho=coefs,
            sigma=sigma,
            constant=True,
            dims="obs_id_fut_1",
        )
        trend = pm.Deterministic("trend_fut", alpha + beta * t_fut, dims="obs_id_fut")
        mu = ar1_fut[1:] + trend

        yhat_fut = pm.Normal("yhat_fut", mu=mu, sigma=sigma, dims="obs_id_fut")
        # use the updated values and predict outcomes and probabilities:
        idata_preds = pm.sample_posterior_predictive(
            idata_ar, var_names=["likelihood", "yhat_fut"], predictions=True, random_seed=100
        )

    return idata_ar, idata_preds, AR


priors_0 = {
    "coefs": {"mu": [0.2, 0.2], "sigma": [0.5, 0.03], "size": 2},
    "alpha": {"mu": -4, "sigma": 0.1},
    "beta": {"mu": -0.1, "sigma": 0.2},
    "sigma": 8,
    "init": {"mu": -4, "sigma": 0.1, "size": 1},
}


idata_trend, preds_trend, model = make_latent_AR_trend_model(y_t, priors_0, full_sample=True)

Sampling: [alpha, ar, beta, coefs, likelihood, sigma]
Auto-assigning NUTS sampler...
Initializing NUTS using jitter+adapt_diag...
Multiprocess sampling (4 chains in 4 jobs)
NUTS: [coefs, sigma, ar, alpha, beta]

Sampling 4 chains for 1_000 tune and 2_000 draw iterations (4_000 + 8_000 draws total) took 57 seconds.
Sampling: [likelihood]

Sampling: [ar1_fut, likelihood, yhat_fut]


pm.model_to_graphviz(model)


plot_fits(idata_trend, preds_trend);


az.summary(idata_trend, var_names=["coefs", "sigma", "alpha", "beta"])


t_data = list(range(200))
n_order = 10
periods = np.array(t_data) / 7

fourier_features = pd.DataFrame(
    {
        f"{func}_order_{order}": getattr(np, func)(2 * np.pi * periods * order)
        for order in range(1, n_order + 1)
        for func in ("sin", "cos")
    }
)

y_t_s = y_t + 20 * fourier_features["sin_order_1"]

fig, ax = plt.subplots(figsize=(10, 4))
ax.plot(y_t_s)
ax.set_title("AR + Trend + Seasonality");


def make_latent_AR_trend_seasonal_model(
    ar_data, ff, priors, prediction_steps=250, full_sample=True, samples=2000
):
    with pm.Model() as AR:
        pass

    ff = ff.to_numpy().T
    t_data = list(range(len(ar_data)))
    AR.add_coord("obs_id", t_data, mutable=True)
    ## The fourier features must be mutable to allow for addition fourier features to be
    ## passed in the prediction step.
    AR.add_coord("fourier_features", np.arange(len(ff)), mutable=True)

    with AR:
        ## Data containers to enable prediction
        t = pm.MutableData("t", t_data, dims="obs_id")
        y = pm.MutableData("y", ar_data, dims="obs_id")
        # The first coefficient will be the intercept term
        coefs = pm.Normal("coefs", priors["coefs"]["mu"], priors["coefs"]["sigma"])
        sigma = pm.HalfNormal("sigma", priors["sigma"])
        # We need one init variable for each lag, hence size is variable too
        init = pm.Normal.dist(
            priors["init"]["mu"], priors["init"]["sigma"], size=priors["init"]["size"]
        )
        # Steps of the AR model minus the lags required given specification
        ar1 = pm.AR(
            "ar",
            coefs,
            sigma=sigma,
            init_dist=init,
            constant=True,
            steps=t.shape[0] - (priors["coefs"]["size"] - 1),
            dims="obs_id",
        )

        ## Priors for the linear trend component
        alpha = pm.Normal("alpha", priors["alpha"]["mu"], priors["alpha"]["sigma"])
        beta = pm.Normal("beta", priors["beta"]["mu"], priors["beta"]["sigma"])
        trend = pm.Deterministic("trend", alpha + beta * t, dims="obs_id")

        ## Priors for seasonality
        beta_fourier = pm.Normal(
            "beta_fourier",
            mu=priors["beta_fourier"]["mu"],
            sigma=priors["beta_fourier"]["sigma"],
            dims="fourier_features",
        )
        fourier_terms = pm.MutableData("fourier_terms", ff)
        seasonality = pm.Deterministic(
            "seasonality", pm.math.dot(beta_fourier, fourier_terms), dims="obs_id"
        )

        mu = ar1 + trend + seasonality

        # The Likelihood
        outcome = pm.Normal("likelihood", mu=mu, sigma=sigma, observed=y, dims="obs_id")
        ## Sampling
        idata_ar = pm.sample_prior_predictive()
        if full_sample:
            idata_ar.extend(pm.sample(samples, random_seed=100, target_accept=0.95))
            idata_ar.extend(pm.sample_posterior_predictive(idata_ar))
        else:
            return idata_ar

    n = prediction_steps - ar_data.shape[0]
    n_order = 10
    periods = (ar_data.shape[0] + np.arange(n)) / 7

    fourier_features_new = pd.DataFrame(
        {
            f"{func}_order_{order}": getattr(np, func)(2 * np.pi * periods * order)
            for order in range(1, n_order + 1)
            for func in ("sin", "cos")
        }
    )

    with AR:
        AR.add_coords({"obs_id_fut_1": range(ar1_data.shape[0] - 1, prediction_steps, 1)})
        AR.add_coords({"obs_id_fut": range(ar1_data.shape[0], prediction_steps, 1)})
        t_fut = pm.MutableData(
            "t_fut", list(range(ar1_data.shape[0], prediction_steps, 1)), dims="obs_id_fut"
        )
        ff_fut = pm.MutableData("ff_fut", fourier_features_new.to_numpy().T)
        # condition on the learned values of the AR process
        # initialise the future AR process precisely at the last observed value in the AR process
        # using the special feature of the dirac delta distribution to be 0 probability everywhere else.
        ar1_fut = pm.AR(
            "ar1_fut",
            init_dist=pm.DiracDelta.dist(ar1[..., -1]),
            rho=coefs,
            sigma=sigma,
            constant=True,
            dims="obs_id_fut_1",
        )
        trend = pm.Deterministic("trend_fut", alpha + beta * t_fut, dims="obs_id_fut")
        seasonality = pm.Deterministic(
            "seasonality_fut", pm.math.dot(beta_fourier, ff_fut), dims="obs_id_fut"
        )
        mu = ar1_fut[1:] + trend + seasonality

        yhat_fut = pm.Normal("yhat_fut", mu=mu, sigma=sigma, dims="obs_id_fut")
        # use the updated values and predict outcomes and probabilities:
        idata_preds = pm.sample_posterior_predictive(
            idata_ar, var_names=["likelihood", "yhat_fut"], predictions=True, random_seed=743
        )

    return idata_ar, idata_preds, AR


priors_0 = {
    "coefs": {"mu": [0.2, 0.2], "sigma": [0.5, 0.03], "size": 2},
    "alpha": {"mu": -4, "sigma": 0.1},
    "beta": {"mu": -0.1, "sigma": 0.2},
    "beta_fourier": {"mu": 0, "sigma": 2},
    "sigma": 8,
    "init": {"mu": -4, "sigma": 0.1, "size": 1},
}


idata_t_s, preds_t_s, model = make_latent_AR_trend_seasonal_model(y_t_s, fourier_features, priors_0)

Sampling: [alpha, ar, beta, beta_fourier, coefs, likelihood, sigma]
Auto-assigning NUTS sampler...
Initializing NUTS using jitter+adapt_diag...
Multiprocess sampling (4 chains in 4 jobs)
NUTS: [coefs, sigma, ar, alpha, beta, beta_fourier]

Sampling 4 chains for 1_000 tune and 2_000 draw iterations (4_000 + 8_000 draws total) took 70 seconds.
Sampling: [likelihood]

Sampling: [ar1_fut, likelihood, yhat_fut]


pm.model_to_graphviz(model)


az.summary(idata_t_s, var_names=["alpha", "beta", "coefs", "beta_fourier"])


plot_fits(idata_t_s, preds_t_s)


%load_ext watermark
%watermark -n -u -v -iv -w -p pytensor,aeppl,xarray

Last updated: Wed Nov 09 2022

Python implementation: CPython
Python version       : 3.9.0
IPython version      : 8.4.0

pytensor: 2.8.7
aeppl : 0.0.38
xarray: 2022.10.0

arviz     : 0.12.1
pymc      : 4.2.2
numpy     : 1.23.4
pandas    : 1.5.1
sys       : 3.9.0 (default, Nov 15 2020, 06:25:35) 
[Clang 10.0.0 ]
matplotlib: 3.6.1

Watermark: 2.3.1

	mean	sd	hdi_3%	hdi_97%	mcse_mean	mcse_sd	ess_bulk	ess_tail	r_hat
coefs[0]	9.744	0.094	9.555	9.911	0.001	0.001	13107.0	6200.0	1.0
coefs[1]	-0.815	0.021	-0.854	-0.776	0.000	0.000	9141.0	5792.0	1.0
sigma	0.506	0.028	0.453	0.557	0.001	0.000	2965.0	5254.0	1.0

	mean	sd	hdi_3%	hdi_97%	mcse_mean	mcse_sd	ess_bulk	ess_tail	r_hat
coefs[0]	1.086	0.475	0.220	2.006	0.010	0.007	2482.0	4278.0	1.0
coefs[1]	0.210	0.029	0.156	0.264	0.000	0.000	7296.0	5931.0	1.0
sigma	7.557	0.389	6.841	8.284	0.007	0.005	3332.0	4817.0	1.0
alpha	-3.969	0.099	-4.171	-3.794	0.001	0.001	9220.0	5606.0	1.0
beta	-0.145	0.009	-0.161	-0.128	0.000	0.000	1785.0	3995.0	1.0

	mean	sd	hdi_3%	hdi_97%	mcse_mean	mcse_sd	ess_bulk	ess_tail	r_hat
alpha	-3.986	0.099	-4.172	-3.797	0.001	0.001	13106.0	6145.0	1.0
beta	-0.182	0.012	-0.204	-0.159	0.000	0.000	3522.0	5420.0	1.0
coefs[0]	0.595	0.484	-0.287	1.536	0.009	0.006	3177.0	5203.0	1.0
coefs[1]	0.195	0.029	0.137	0.246	0.000	0.000	11284.0	6668.0	1.0
beta_fourier[0]	5.700	1.681	2.558	8.785	0.018	0.013	8413.0	5505.0	1.0
beta_fourier[1]	0.275	1.647	-2.913	3.280	0.018	0.018	8501.0	5712.0	1.0
beta_fourier[2]	0.188	1.641	-2.862	3.241	0.017	0.017	9114.0	5857.0	1.0
beta_fourier[3]	-0.066	1.669	-3.209	3.026	0.018	0.018	8683.0	6748.0	1.0
beta_fourier[4]	0.172	1.667	-2.771	3.382	0.017	0.018	9684.0	6683.0	1.0
beta_fourier[5]	-0.143	1.668	-3.285	2.910	0.017	0.018	9728.0	5846.0	1.0
beta_fourier[6]	-0.176	1.624	-3.215	2.860	0.017	0.018	9020.0	5924.0	1.0
beta_fourier[7]	-0.151	1.672	-3.222	3.015	0.017	0.018	9259.0	6636.0	1.0
beta_fourier[8]	-0.174	1.659	-3.277	2.944	0.017	0.018	9347.0	6390.0	1.0
beta_fourier[9]	-0.021	1.637	-3.198	2.878	0.018	0.017	8138.0	6374.0	1.0
beta_fourier[10]	-5.691	1.683	-8.789	-2.487	0.018	0.013	8219.0	6287.0	1.0
beta_fourier[11]	0.298	1.652	-2.769	3.415	0.018	0.018	8453.0	5843.0	1.0
beta_fourier[12]	0.016	2.041	-3.673	3.914	0.016	0.026	15708.0	5857.0	1.0
beta_fourier[13]	5.603	1.333	3.018	7.990	0.023	0.016	3460.0	5277.0	1.0
beta_fourier[14]	5.691	1.650	2.570	8.754	0.018	0.013	8261.0	6341.0	1.0
beta_fourier[15]	0.289	1.634	-2.897	3.245	0.018	0.018	8464.0	6278.0	1.0
beta_fourier[16]	0.214	1.654	-2.989	3.200	0.017	0.017	9169.0	6719.0	1.0
beta_fourier[17]	-0.031	1.663	-3.224	2.996	0.018	0.019	8464.0	5444.0	1.0
beta_fourier[18]	0.177	1.683	-2.978	3.316	0.018	0.020	9126.0	5907.0	1.0
beta_fourier[19]	-0.146	1.669	-3.339	2.925	0.018	0.019	8771.0	6316.0	1.0

Forecasting with Structural AR Timeseries¶

Generate Fake Autoregressive Data¶

Specifying the Model¶

Prediction Step¶

Inspecting model fit and forecast¶

Complicating the Picture¶

Wrapping our model into a function¶

Specifying a Trend Model¶

Complicating the picture further¶

Specifying the Trend + Seasonal Model¶

Closing Remarks¶

Authors¶

Watermark¶