Code Companion¶
To accompany Probabilistic Machine Learning: New Frontiers for Modeling Consumers and their Choices
Introduction¶
In this notebook, we will demonstrate how to use two probabilistic programming languages -- Stan and Pyro -- to estimate probabilistic machine learning models.
Prerequisites:
- Stan will be called using cmdstanpy, which requires a working CmdStan installation. This can be installed easily by calling cmdstanpy.install_cmdstan() in Python after installing the cmdstanpy package.
- Pyro requires torch as a dependency.
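For reference, a minimal one-time setup might look like the following (a sketch, assuming a pip-based environment; adjust to your own setup):
# One-time setup (sketch): first run `pip install cmdstanpy pyro-ppl`, then:
import cmdstanpy
cmdstanpy.install_cmdstan()  # downloads and builds CmdStan; only needed once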
import numpy as np
from matplotlib import pyplot as plt
import seaborn as sns
np.random.seed(0)
DGP: Mixed Logit¶
To illustrate the key ideas, we will use the mixed logit model, as introduced in Section 1 of the paper. That model generates choices as: \begin{gather*} P(y_{it} = j) = \frac{\exp(\theta_{i}'x_{ijt})}{\sum_{k} \exp(\theta_{i}'x_{ikt})} \\ \theta_i \sim \mathcal{N}(\mu, \Sigma). \end{gather*} Here, we will assume that $\Sigma = \mathrm{diag}(\sigma^2)$, where $\sigma$ is a vector.
We will start by generating some data from this model. Then we'll specify a model, using this likelihood plus some appropriate priors, using both Stan and Pyro.
n_cust = 200
n_obs = 10
n_alts = 3
n_feats = 2
n_pars = n_alts + n_feats - 1
coef_idx = [j for j in range(n_alts-1, n_pars)]
X = np.random.normal(size=(n_cust, n_obs, n_alts, n_feats))
def softmax(x):
return np.exp(x)/sum(np.exp(x))
# DGP
mu = np.random.normal(loc=0, scale=1, size=(n_alts+n_feats-1))
sigma = np.random.uniform(low=0.5, high=1.5, size=n_pars)
theta = np.random.multivariate_normal(mean=mu, cov=np.diag(sigma), size=n_cust)
y = np.zeros((n_cust,n_obs), dtype=int)
for i in range(n_cust):
for t in range(n_obs):
v = np.zeros(n_alts)
v[0] = theta[i,coef_idx] @ X[i,t,0] # Normalize first brand's intercept
for j in range(1,n_alts):
v[j] = theta[i,j-1] + theta[i,coef_idx] @ X[i,t,j]
probs = softmax(v)
y[i,t] = np.random.choice(n_alts, size=1, p=probs)[0]+1
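Before moving on, a quick sanity check of the simulated data can be useful (illustrative only); for example, the overall choice shares across the three alternatives:
# Quick sanity check: overall choice shares (choice labels are 1-indexed)
values, counts = np.unique(y, return_counts=True)
print(dict(zip(values.tolist(), (counts / counts.sum()).round(3).tolist())))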
Inference with Stan¶
Stan is a PPL that is callable from many different programming languages. Stan has its own syntax for defining models, and can be viewed as a standalone programming language for building probabilistic models. Here, we will build a Stan model and call it using cmdstanpy, a Python interface to CmdStan, the command-line version of Stan. Stan is fairly beginner-friendly, but does require learning its syntax (which is similar to other high-level programming languages like R).
import cmdstanpy
In Stan code, models are specified in blocks:
- In the data block, all of the data is named, with dimensions specified
- In the transformed data block, any useful transformations or new variables can be defined
- In the parameters block, any latent variables are defined, with their dimensions specified
- In transformed parameters, any useful transformations of the parameters are computed. Note that transformations can be defined here, or in the next block (model). By defining them here, Stan will save samples of them.
- Finally, in the model block, the actual DGP is defined, using the "~" notation to denote "is distributed as," along with various distribution functions to define the model's priors and likelihood.
We copy the Stan code below for reference, though the code we actually call is saved separately as mixed_logit.stan.
stan_mixed_logit_example_code = """
data {
int<lower=1> n_cust;
int<lower=1> n_obs; // assumes every customer has the same number of obs
int<lower=1> n_alts;
int<lower=1> n_feats;
array[n_cust, n_obs, n_alts, n_feats] real X;
array[n_cust, n_obs] int<lower=1,upper=n_alts> y;
}
transformed data {
// create some convenient indexes
int<lower=1> n_pars = n_alts+n_feats-1;
}
parameters {
matrix[n_pars, n_cust] z_theta;
vector[n_pars] mu;
cholesky_factor_corr[n_pars] L_Omega;
vector<lower=0>[n_pars] sigma;
}
transformed parameters {
matrix[n_pars, n_cust] theta;
theta = rep_matrix(mu, n_cust) + diag_matrix(sqrt(sigma)) * z_theta;
}
model {
to_vector(z_theta) ~ normal(0,1);
sigma ~ cauchy(0,2.5);
mu ~ normal(0,5);
for (i in 1:n_cust) {
for (t in 1:n_obs) {
vector[n_alts] utils; // temp variable
utils[1] = dot_product(theta[n_alts:n_pars,i], to_vector(X[i,t,1]));
for (j in 2:n_alts) {
utils[j] = theta[j-1,i] + dot_product(theta[n_alts:n_pars,i], to_vector(X[i,t,j]));
}
y[i,t] ~ categorical_logit(utils);
}
}
}
"""
Notice how easy the model is to modify: we can use whatever priors we like for any of the variables, including heavier-tailed choices like the half-Cauchy prior on sigma, which is less informative due to its fat tails.
model = cmdstanpy.CmdStanModel(stan_file="mixed_logit.stan");
To use Stan, we need to format our data as a dictionary, where each entry in the dictionary has a matching variable name in the data block of the Stan program:
stan_data = {
"n_cust": n_cust,
"n_obs": n_obs,
"n_alts": n_alts,
"n_feats": n_feats,
"X": X,
"y": y
}
Inference: HMC/NUTS¶
With the model defined, we need to do inference: either approximate the posterior or draw samples from it. We'll start with the latter, which is straightforward using HMC/NUTS via the .sample method on the model. This automatically uses NUTS, with 2000 iterations (1000 warmup and 1000 sampling, by default).
(Additional documentation can be found here: https://mc-stan.org/cmdstanpy/users-guide/examples/MCMC%20Sampling.html)
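If different settings are desired, they can be passed directly to .sample. Below is a sketch (the argument names are cmdstanpy's; the values are illustrative, and this run is not used elsewhere in the notebook):
# Illustrative only: run 4 chains with custom warmup/sampling iterations
fit_custom = model.sample(
    stan_data,
    chains=4,
    iter_warmup=500,
    iter_sampling=1500,
    seed=0,
)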
fit = model.sample(stan_data, chains=1, seed=0)
17:22:33 - cmdstanpy - INFO - CmdStan start processing
17:23:19 - cmdstanpy - INFO - CmdStan done processing.
From this, we can reason about the posterior. For instance, we can look at the posterior distribution of $\mu$:
# Access the posterior draws of mu:
mu_samples_stan_nuts = fit.stan_variable('mu')
fig, axs = plt.subplots(2, 2, figsize=(10, 8))
for i, mu_val in enumerate(mu):
# Select the subplot for this parameter
ax = axs[i // 2, i % 2]
sns.histplot(mu_samples_stan_nuts[:,i], bins=30, kde=True, ax=ax, label="NUTS", stat='density')
ax.axvline(x=mu_val, color='red', linestyle='--', linewidth=2)
ax.set_xlabel('Samples')
ax.set_ylabel('Density')
ax.set_title(f'Posterior of $\\mu_{{{i}}}$')
# Adjust the layout
plt.tight_layout()
plt.legend()
# Show the plots
plt.show()
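As a quick numerical check (values will vary with the seed), we can also compare the NUTS posterior means of $\mu$ to the true values used in the DGP:
# Compare NUTS posterior means of mu to the true values from the DGP
print("true mu:            ", np.round(mu, 3))
print("NUTS posterior mean:", np.round(mu_samples_stan_nuts.mean(axis=0), 3))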
Inference: ADVI¶
Stan also supports two types of variational inference, the first being Automatic Differentiation Variational Inference (ADVI). In ADVI, all variables are first transformed to an unconstrained space via reversible transformations. A mean-field normal variational family is then assumed in that unconstrained space and optimized. This makes ADVI very automatic, but also somewhat limited, and (in the authors' experience) prone to yielding poor approximations to the posterior.
(Additional documentation can be found here: https://mc-stan.org/cmdstanpy/users-guide/examples/Variational%20Inference.html)
vi = model.variational(data=stan_data, seed=0)
17:23:20 - cmdstanpy - INFO - Chain [1] start processing
17:23:23 - cmdstanpy - INFO - Chain [1] done processing
First, notice that this was much faster computationally: just 3 seconds to get an approximate posterior, as opposed to almost a minute for NUTS. This speed-up comes at a cost, which is part of the "iron simplex" described in the paper: ADVI is faster than HMC, but the approximate posterior is not particularly accurate in terms of uncertainty quantification. We demonstrate that below by plotting the four approximate posterior distributions of $\mu$ and comparing them to the posterior estimated by NUTS. We see that, for some parameters, ADVI is reasonably accurate, while for others, it is biased. In all cases, ADVI underestimates the posterior variance.
fig, axs = plt.subplots(2, 2, figsize=(10, 8))
for i, mu_val in enumerate(mu):
# Select the subplot for this parameter
ax = axs[i // 2, i % 2]
sns.histplot(mu_samples_stan_nuts[:,i], bins=30, kde=True, ax=ax, label="NUTS", stat='density')
sns.histplot(vi.variational_sample[:, vi.column_names.index(f'mu[{i+1}]')], bins=30, kde=True, ax=ax, label='ADVI', stat='density')
ax.axvline(x=mu_val, color='red', linestyle='--', linewidth=2)
ax.set_xlabel('Samples')
ax.set_ylabel('Density')
ax.set_title(f'Posterior of $\\mu_{{{i}}}$')
# Adjust the layout
plt.tight_layout()
plt.legend()
# Show the plots
plt.show()
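To make the variance underestimation concrete, we can compare the posterior standard deviations of $\mu$ under NUTS and ADVI (a quick illustrative check; the indexing into the ADVI draws mirrors the plotting code above):
# Posterior standard deviations of mu: NUTS vs. ADVI
advi_mu_cols = [vi.column_names.index(f'mu[{i+1}]') for i in range(len(mu))]
print("NUTS sd:", np.round(mu_samples_stan_nuts.std(axis=0), 3))
print("ADVI sd:", np.round(vi.variational_sample[:, advi_mu_cols].std(axis=0), 3))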
In some cases, as we will see later for black box SVI in Pyro, variational inference does a poor job of recovering global, population-level parameters like $\mu$, but a better job of recovering local, individual-level parameters like $\theta_{i}$. For ADVI, at least in this example, this is not the case:
fig, axs = plt.subplots(2, 2, figsize=(10, 8))
for i, mu_val in enumerate(mu):
# Select the subplot for this parameter
ax = axs[i // 2, i % 2]
sns.histplot(fit.stan_variable('theta')[:,0,i], bins=30, kde=True, ax=ax, label="NUTS", stat='density')
sns.histplot(vi.variational_sample[:, vi.column_names.index(f'theta[{i+1},1]')], bins=30, kde=True, ax=ax, label='ADVI', stat='density')
ax.set_xlabel('Samples')
ax.set_ylabel('Density')
ax.set_title(f'Posterior of $\\theta_{{1,{i}}}$')
# Adjust the layout
plt.tight_layout()
plt.legend()
# Show the plots
plt.show()
We see that the local variables are biased in much the same way as $\mu$. This is likely a systematic issue with ADVI: in the authors' experience, ADVI rarely yields a good approximation, except in very simple cases.
Inference: Pathfinder VI¶
Stan also implements another automatic variational inference method called Pathfinder (https://jmlr.org/papers/v23/21-0889.html). This algorithm is intended to be faster than ADVI and to yield better approximations to the posterior. We will explore its performance below.
Note: again, the power of PML and PPLs is that we can very easily swap out inference algorithms like this. Moreover, we can adjust the settings of each algorithm to trade off speed and accuracy. Below, we use Pathfinder with settings recommended by one of the method's developers (see: https://users.aalto.fi/~ave/casestudies/Birthdays/birthdays.html), and with psis_resample=False, which was required to get the algorithm to return meaningful posterior draws.
pf = model.pathfinder(
data=stan_data,
psis_resample=False,
seed=0,
inits=0.1,
num_paths=10,
num_single_draws=40,
draws=1000,
history_size=100,
max_lbfgs_iters=100,
)
17:23:24 - cmdstanpy - INFO - Chain [1] start processing
17:23:49 - cmdstanpy - INFO - Chain [1] done processing
fig, axs = plt.subplots(2, 2, figsize=(10, 8))
for i, mu_val in enumerate(mu):
# Select the subplot for this parameter
ax = axs[i // 2, i % 2]
sns.histplot(mu_samples_stan_nuts[:,i], bins=30, kde=True, ax=ax, label="NUTS", stat='density')
sns.histplot(pf.draws()[:, pf.column_names.index(f'mu[{i+1}]')], bins=30, kde=True, ax=ax, label='Pathfinder', stat='density')
ax.axvline(x=mu_val, color='red', linestyle='--', linewidth=2)
ax.set_xlabel('Samples')
ax.set_ylabel('Density')
ax.set_title(f'Posterior of $\\mu_{{{i}}}$')
# Adjust the layout
plt.tight_layout()
plt.legend()
# Show the plots
plt.show()
Here, we see that Pathfinder does a better job than ADVI at approximating the posterior for some of the variables. It also doesn't exhibit the same problematic underestimation of the posterior variance -- in fact, at least for this example, it seems to overestimate uncertainty.
(One caveat is that the Pathfinder settings were set manually, while ADVI's were left at their defaults. It's possible that running ADVI for longer, or enabling other features (like a full-rank covariance), would improve ADVI's approximation.)
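For completeness, here is a sketch of how one might try that; the algorithm and iter arguments are cmdstanpy options for ADVI, the values below are untuned illustrations, and this run is not used elsewhere in the notebook:
# Sketch: re-run ADVI with a full-rank Gaussian family and more iterations
vi_fullrank = model.variational(
    data=stan_data,
    algorithm="fullrank",
    iter=20000,
    seed=0,
)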
Inference with Pyro¶
Pyro is a PPL that works differently from Stan: rather than introducing a standalone syntax, Pyro infers probability models from Python code. It relies on PyTorch, one of the most popular deep learning libraries, for fast computation and automatic differentiation. Thus, all latent variables in the Python code defining a model must be declared as PyTorch or Pyro objects.
Pyro is more flexible than Stan, in the following ways:
- As in Stan, it has a robust implementation of NUTS; however, it also allows for computation using GPUs, which can greatly accelerate computation times
- For VI, Pyro has a sophisticated implementation of BBVI, which can also use stochastic gradients (i.e., SVI). This form of VI is more flexible than ADVI/Pathfinder, as it allows the user to create a custom variational distribution (more here: https://pyro.ai/examples/svi_part_i.html)
This additional flexibility comes at a cost: in our experience, Pyro can be a bit more challenging to use, especially if one wants to take advantage of its more advanced features. The time invested in learning it can be worth it, however, especially for implementing large models on large datasets where scalability is a central concern.
Let's start by importing all the required libraries:
import torch
import pyro
import pyro.distributions as dist
import torch.nn.functional as F
torch.set_default_dtype(torch.float64)
# Setting the random seed for reproducibility
pyro.set_rng_seed(0)
Next, we will do some slight reshuffling of the data. Our Pyro code is slightly more general than our Stan code, allowing for different numbers of observations per person, which we accommodate via an ID vector. Since Pyro operates on PyTorch, all data must be in the form of torch tensors.
pyro_data = {}
pyro_data['X'] = torch.tensor(X.reshape((n_cust*n_obs, n_alts, n_feats)))
pyro_data['y'] = torch.tensor(y.reshape(-1) - 1)
pyro_data['id'] = torch.repeat_interleave(torch.arange(n_cust), n_obs)
n_obs_total, n_brands, n_feats = pyro_data['X'].shape
n_nonzero_icepts = n_brands - 1
n_pars = n_nonzero_icepts + n_feats
As described above, in Pyro the model is written as a standard Python function that encodes the DGP using Pyro sampling statements and torch-based operations:
# Define model
def pyro_model(X, y, id):
mu = pyro.sample("mu", dist.Normal(0, 5).expand([n_pars]).to_event(1))
sigma = pyro.sample("sigma", dist.HalfNormal(5).expand([n_pars]).to_event(1))
with pyro.plate("coefs", n_cust):
theta = pyro.sample("theta", dist.Normal(mu, sigma).to_event(1))
theta_icepts = theta[:, :n_nonzero_icepts]
theta_feats = theta[:, n_nonzero_icepts:]
zeros_for_first_brand = torch.zeros((n_obs_total, 1))
theta_icepts_with_zero = torch.cat([zeros_for_first_brand, theta_icepts[id]], dim=1)
theta_feats_expanded = theta_feats[id].unsqueeze(1)
X_weighted = X * theta_feats_expanded
utils = theta_icepts_with_zero + torch.sum(X_weighted, dim=-1)
p = F.softmax(utils, dim=-1)
with pyro.plate("data", len(y)):
pyro.sample("choices", dist.Categorical(probs=p), obs=y)
One interesting thing to note about the Pyro model is the pyro.plate specification: this declares the sampling statements that follow as conditionally independent, and can be used to accelerate inference, as we will see later.
Inference: NUTS¶
Now, we define the inference algorithm. There are two steps:
- First, we need to define our MCMC "kernel" -- this simply specifies how each iteration of the MCMC algorithm is generated. Here, we will use NUTS, but Pyro also allows for sampling with random-walk Metropolis-Hastings (RWMH) and vanilla HMC.
- Second, we use the kernel to define an MCMC object, which we then use to run MCMC.
from pyro.infer import MCMC, NUTS
kernel = NUTS(pyro_model)
mcmc = MCMC(kernel, num_samples=1000, warmup_steps=1000)
mcmc.run(pyro_data["X"], pyro_data["y"], pyro_data["id"])
Sample: 100%|██████████| 2000/2000 [00:58, 34.04it/s, step size=2.25e-01, acc. prob=0.841]
Now, we will collect the samples, and compare them to Stan's NUTS outputs:
pyro_nuts_samples = {k: v.detach().cpu().numpy() for k, v in mcmc.get_samples().items()}
fig, axs = plt.subplots(2, 2, figsize=(10, 8))
for i, mu_val in enumerate(mu):
ax = axs[i // 2, i % 2]
sns.histplot(mu_samples_stan_nuts[:,i], bins=30, kde=True, ax=ax, label="Stan", stat='density')
sns.histplot(pyro_nuts_samples['mu'][:,i], bins=30, kde=True, ax=ax, label='Pyro', stat='density')
ax.axvline(x=mu_val, color='red', linestyle='--', linewidth=2)
ax.set_xlabel('Samples')
ax.set_ylabel('Density')
ax.set_title(f'Posterior of $\\mu_{{{i}}}$')
plt.tight_layout()
plt.legend()
plt.show()
We see that the two almost perfectly coincide. This is as expected: NUTS is a fairly robust algorithm that samples from the true posterior.
Inference: SVI (BBVI)¶
Now, let's explore how to do this same thing, but using stochastic variational inference. We will demonstrate three approaches:
- In the first approach, we will use a mean field normal variational family, which assumes that every latent variable's posterior can be approximated by a normal distribution. This is very easy to do in Pyro, as we will demonstrate below.
- In the second approach, we will use a normal distribution with a full covariance matrix as the variational family. This allows for also approximating posterior covariances.
- Finally, in a third approach, we will define a custom variational family, showcasing the flexibility of Pyro.
Approach 1: Mean Field Normal Variational Family
Another nice benefit of PPLs is their modularity. As with Stan, to estimate our model with VI, we don't have to change the model itself; we just need to modify the inference procedure.
In Pyro, the variational approximation is called the guide. Thus, setting the variational family is equivalent to defining the guide. To use a mean field normal variational family, Pyro has a very useful utility function called AutoNormal. We demonstrate below:
from pyro.infer import SVI, Trace_ELBO
from pyro.infer.autoguide import AutoNormal
from pyro.optim import Adam
from tqdm import trange
guide = AutoNormal(pyro_model)
optimizer = Adam({"lr": 0.01})
svi = SVI(pyro_model, guide, optimizer, loss=Trace_ELBO())
num_steps = 2000
losses = []
for step in trange(num_steps):
loss = svi.step(pyro_data['X'], pyro_data['y'], pyro_data['id'])
losses.append(loss)
100%|██████████| 2000/2000 [00:04<00:00, 430.13it/s]
Notice how fast this is: mere seconds to compute an approximate posterior.
To assess convergence of the algorithm, we can plot the loss over iterations:
plt.plot(losses)
plt.show()
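Once the ELBO has converged, the fitted guide holds the approximate posterior. As a sketch of how one might pull approximate posterior draws of $\mu$ out of it for comparison with NUTS (using Pyro's Predictive utility; the variable names here are our own):
# Sketch: draw approximate posterior samples of mu from the fitted guide
from pyro.infer import Predictive

predictive = Predictive(pyro_model, guide=guide, num_samples=1000,
                        return_sites=["mu", "sigma", "theta"])
svi_draws = predictive(pyro_data['X'], pyro_data['y'], pyro_data['id'])
mu_samples_svi = svi_draws["mu"].detach().squeeze().numpy()
print("SVI approximate posterior mean of mu:", mu_samples_svi.mean(axis=0).round(3))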