Skip to content

Instantly share code, notes, and snippets.

@canyon289
Last active March 3, 2021 05:41
Show Gist options
  • Save canyon289/97c94048d51ad3af80474f3adfa9c611 to your computer and use it in GitHub Desktop.
Save canyon289/97c94048d51ad3af80474f3adfa9c611 to your computer and use it in GitHub Desktop.
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "markdown",
"id": "missing-community",
"metadata": {},
"source": [
"# Group-level and individual-level out-of-sample predictions\n",
"While trying to generate both kinds of prediction I ran into two questions:\n",
"1. Is adding RVs after sampling, for posterior predictive sampling, an abuse of the API?\n",
"2. Why do unconditioned RVs affect the logp of the model (and alter sampling)?"
]
},
{
"cell_type": "code",
"execution_count": 1,
"id": "alpine-light",
"metadata": {},
"outputs": [],
"source": [
"import pymc3 as pm\n",
"import matplotlib.pyplot as plt\n",
"import arviz as az\n",
"import pandas as pd\n",
"import numpy as np\n",
"from scipy import stats\n",
"import theano"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "economic-great",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"'3.11.0'"
]
},
"execution_count": 2,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"pm.__version__"
]
},
{
"cell_type": "markdown",
"id": "defensive-ozone",
"metadata": {},
"source": [
"# Make some data"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "architectural-cameroon",
"metadata": {
"jupyter": {
"source_hidden": true
}
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Finished location 0\n",
"Finished location 1\n",
"Finished location 2\n",
"Finished location 3\n",
"Finished location 4\n",
"Finished location 5\n"
]
}
],
"source": [
"def salad_generator(hyperprior_beta_mean=5, hyperprior_beta_sd=.3, sigma=50, days_per_location=[5, 3, 15, 10, 3, 5]):\n",
"    \"\"\"Generate noisy salad sales data for several restaurant locations.\n",
"\n",
"    Every location draws its own slope from Normal(hyperprior_beta_mean, hyperprior_beta_sd).\n",
"    Daily sales are that slope times the number of customers, plus Normal(0, sigma) noise.\n",
"\n",
"    Parameters\n",
"    ----------\n",
"    hyperprior_beta_mean : mean of the distribution the per-location slopes are drawn from\n",
"    hyperprior_beta_sd : standard deviation of that distribution\n",
"    sigma : standard deviation of the additive noise on sales\n",
"    days_per_location : number of observed days for each location (one entry per location);\n",
"        the default list is only iterated, never mutated\n",
"\n",
"    Returns\n",
"    -------\n",
"    DataFrame with columns customers, sales and location, and a fresh 0..n-1 index.\n",
"    \"\"\"\n",
"    beta_hyperprior = stats.norm(hyperprior_beta_mean, hyperprior_beta_sd)\n",
"\n",
"    # Seed once, before the loop. Re-seeding inside the loop restarted the random\n",
"    # stream for every location, so locations with the same number of days\n",
"    # received identical customers, slope and noise.\n",
"    np.random.seed(0)\n",
"\n",
"    # Collect the per-location frames and concatenate once at the end\n",
"    location_dfs = []\n",
"    for i, days in enumerate(days_per_location):\n",
"        num_customers = stats.randint(30, 100).rvs(days)\n",
"        sales_location = beta_hyperprior.rvs()*num_customers + stats.norm(0, sigma).rvs(num_customers.shape)\n",
"\n",
"        location_df = pd.DataFrame({\"customers\": num_customers, \"sales\": sales_location})\n",
"        location_df[\"location\"] = i\n",
"        # sort_values returns a new frame; keep it (the result used to be discarded)\n",
"        location_df = location_df.sort_values(by=\"customers\", ascending=True)\n",
"        location_dfs.append(location_df)\n",
"\n",
"        print(f\"Finished location {i}\")\n",
"\n",
"    if not location_dfs:\n",
"        # No locations requested: return an empty frame with the usual columns\n",
"        return pd.DataFrame(columns=[\"customers\", \"sales\", \"location\"])\n",
"\n",
"    # ignore_index=True gives the same fresh index as reset_index(drop=True)\n",
"    return pd.concat(location_dfs, ignore_index=True)\n",
"\n",
"hierarchical_salad_df = salad_generator()"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "handy-brush",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 576x432 with 6 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"fig, axes = plt.subplots(2, 3, sharex=True, sharey=True, figsize=(8, 6))\n",
"\n",
"# One scatter panel per location; enumerate(axes.ravel()) pairs panel i with location i\n",
"for i, ax in enumerate(axes.ravel()):\n",
"    location_filter = (hierarchical_salad_df[\"location\"] == i)\n",
"    hierarchical_salad_df[location_filter].plot(kind=\"scatter\", x=\"customers\", y=\"sales\", ax=ax)\n",
"    # Blank the per-panel labels; shared labels are set once on axes[1,0] below\n",
"    ax.set_xlabel(\"\")\n",
"    ax.set_ylabel(\"\")\n",
"\n",
"# The line break in the title must be the two-character escape inside the Python string\n",
"fig.suptitle(\"A bunch of simulated data \\n for a Hierarchical model\")\n",
"axes[1,0].set_xlabel(\"Number of Customers\")\n",
"axes[1,0].set_ylabel(\"Sales\");"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "super-aquarium",
"metadata": {},
"outputs": [],
"source": [
"# Plain NumPy views of the two numeric columns\n",
"customers = hierarchical_salad_df[\"customers\"].values\n",
"sales = hierarchical_salad_df[\"sales\"].values\n",
"\n",
"# Categorical encoding of the location column; its .codes index the per-location slopes\n",
"location_category = pd.Categorical(hierarchical_salad_df[\"location\"])"
]
},
{
"cell_type": "markdown",
"id": "needed-feature",
"metadata": {},
"source": [
"# Sample Non Centered"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "forty-showcase",
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/sampling.py:465: FutureWarning: In an upcoming release, pm.sample will return an `arviz.InferenceData` object instead of a `MultiTrace` by default. You can pass return_inferencedata=True or return_inferencedata=False to be safe and silence this warning.\n",
" warnings.warn(\n",
"Auto-assigning NUTS sampler...\n",
"Initializing NUTS using jitter+adapt_diag...\n",
"Multiprocess sampling (4 chains in 4 jobs)\n",
"NUTS: [β_offset, β_σ_hyperprior, β_μ_hyperprior, σ]\n"
]
},
{
"data": {
"text/html": [
"\n",
" <div>\n",
" <style>\n",
" /* Turns off some styling */\n",
" progress {\n",
" /* gets rid of default border in Firefox and Opera. */\n",
" border: none;\n",
" /* Needs to be in here for Safari polyfill so background images work as expected. */\n",
" background-size: auto;\n",
" }\n",
" .progress-bar-interrupted, .progress-bar-interrupted::-webkit-progress-bar {\n",
" background: #F44336;\n",
" }\n",
" </style>\n",
" <progress value='8000' class='' max='8000' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
" 100.00% [8000/8000 00:03<00:00 Sampling 4 chains, 81 divergences]\n",
" </div>\n",
" "
],
"text/plain": [
"<IPython.core.display.HTML object>"
]
},
"metadata": {},
"output_type": "display_data"
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"Sampling 4 chains for 1_000 tune and 1_000 draw iterations (4_000 + 4_000 draws total) took 4 seconds.\n",
"There were 17 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"There were 10 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"There were 27 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"There were 27 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"The number of effective samples is smaller than 25% for some parameters.\n"
]
}
],
"source": [
"with pm.Model() as model_hierarchical_salad_sales_predictions:\n",
"\n",
"    # Observation noise, shared by every location\n",
"    σ = pm.HalfNormal(\"σ\", 20)\n",
"\n",
"    # Group-level mean and spread of the per-location slopes\n",
"    β_μ_hyperprior = pm.Normal(\"β_μ_hyperprior\", 10, 10)\n",
"    β_σ_hyperprior = pm.HalfNormal(\"β_σ_hyperprior\", 10)\n",
"\n",
"    # Non-centered form: standard-normal offsets, shifted and scaled into β below.\n",
"    # One offset per location category instead of a hard-coded count.\n",
"    β_offset = pm.Normal('β_offset', mu=0, sd=1, shape=len(location_category.categories))\n",
"\n",
"    β = pm.Deterministic(\"β\", β_μ_hyperprior + β_offset * β_σ_hyperprior)\n",
"\n",
"    # Each row picks the slope of its own location through the category codes\n",
"    μ = pm.Deterministic('μ', β[location_category.codes] * hierarchical_salad_df.customers)\n",
"\n",
"    sales = pm.Normal(\"sales\", mu=μ, sd=σ, observed=hierarchical_salad_df.sales)\n",
"\n",
"    # Request a MultiTrace explicitly: this silences the FutureWarning and keeps\n",
"    # the return type stable when the library default changes.\n",
"    trace_hierarchical_salad_sales_noncentered = pm.sample(random_seed=0, return_inferencedata=False)\n",
"\n",
"    inf_data_hierarchical_salad_sales_noncentered = az.from_pymc3(\n",
"        trace=trace_hierarchical_salad_sales_noncentered,\n",
"        coords={\"β_dim_0\": location_category.categories},\n",
"    )"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "focused-hampshire",
"metadata": {},
"outputs": [
{
"data": {
"image/svg+xml": [
"<?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?>\n",
"<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n",
" \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\n",
"<!-- Generated by graphviz version 2.42.3 (20191010.1750)\n",
" -->\n",
"<!-- Title: %3 Pages: 1 -->\n",
"<svg width=\"419pt\" height=\"452pt\"\n",
" viewBox=\"0.00 0.00 418.54 451.86\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\n",
"<g id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 447.86)\">\n",
"<title>%3</title>\n",
"<polygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-447.86 414.54,-447.86 414.54,4 -4,4\"/>\n",
"<g id=\"clust1\" class=\"cluster\">\n",
"<title>cluster6</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M162.42,-232.91C162.42,-232.91 246.42,-232.91 246.42,-232.91 252.42,-232.91 258.42,-238.91 258.42,-244.91 258.42,-244.91 258.42,-423.86 258.42,-423.86 258.42,-429.86 252.42,-435.86 246.42,-435.86 246.42,-435.86 162.42,-435.86 162.42,-435.86 156.42,-435.86 150.42,-429.86 150.42,-423.86 150.42,-423.86 150.42,-244.91 150.42,-244.91 150.42,-238.91 156.42,-232.91 162.42,-232.91\"/>\n",
"<text text-anchor=\"middle\" x=\"246.92\" y=\"-240.71\" font-family=\"Times,serif\" font-size=\"14.00\">6</text>\n",
"</g>\n",
"<g id=\"clust2\" class=\"cluster\">\n",
"<title>cluster41</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M162.42,-8C162.42,-8 246.42,-8 246.42,-8 252.42,-8 258.42,-14 258.42,-20 258.42,-20 258.42,-209.93 258.42,-209.93 258.42,-215.93 252.42,-221.93 246.42,-221.93 246.42,-221.93 162.42,-221.93 162.42,-221.93 156.42,-221.93 150.42,-215.93 150.42,-209.93 150.42,-209.93 150.42,-20 150.42,-20 150.42,-14 156.42,-8 162.42,-8\"/>\n",
"<text text-anchor=\"middle\" x=\"243.42\" y=\"-15.8\" font-family=\"Times,serif\" font-size=\"14.00\">41</text>\n",
"</g>\n",
"<!-- β_μ_hyperprior -->\n",
"<g id=\"node1\" class=\"node\">\n",
"<title>β_μ_hyperprior</title>\n",
"<ellipse fill=\"none\" stroke=\"black\" cx=\"71.42\" cy=\"-390.38\" rx=\"71.34\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"71.42\" y=\"-401.68\" font-family=\"Times,serif\" font-size=\"14.00\">β_μ_hyperprior</text>\n",
"<text text-anchor=\"middle\" x=\"71.42\" y=\"-386.68\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"71.42\" y=\"-371.68\" font-family=\"Times,serif\" font-size=\"14.00\">Normal</text>\n",
"</g>\n",
"<!-- β -->\n",
"<g id=\"node4\" class=\"node\">\n",
"<title>β</title>\n",
"<polygon fill=\"none\" stroke=\"black\" points=\"249.92,-316.91 158.92,-316.91 158.92,-263.91 249.92,-263.91 249.92,-316.91\"/>\n",
"<text text-anchor=\"middle\" x=\"204.42\" y=\"-301.71\" font-family=\"Times,serif\" font-size=\"14.00\">β</text>\n",
"<text text-anchor=\"middle\" x=\"204.42\" y=\"-286.71\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"204.42\" y=\"-271.71\" font-family=\"Times,serif\" font-size=\"14.00\">Deterministic</text>\n",
"</g>\n",
"<!-- β_μ_hyperprior&#45;&gt;β -->\n",
"<g id=\"edge2\" class=\"edge\">\n",
"<title>β_μ_hyperprior&#45;&gt;β</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M112.04,-359.45C127.66,-347.95 145.52,-334.79 161.36,-323.13\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"163.45,-325.93 169.43,-317.18 159.3,-320.29 163.45,-325.93\"/>\n",
"</g>\n",
"<!-- σ -->\n",
"<g id=\"node2\" class=\"node\">\n",
"<title>σ</title>\n",
"<ellipse fill=\"none\" stroke=\"black\" cx=\"326.42\" cy=\"-187.43\" rx=\"58.88\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"326.42\" y=\"-198.73\" font-family=\"Times,serif\" font-size=\"14.00\">σ</text>\n",
"<text text-anchor=\"middle\" x=\"326.42\" y=\"-183.73\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"326.42\" y=\"-168.73\" font-family=\"Times,serif\" font-size=\"14.00\">HalfNormal</text>\n",
"</g>\n",
"<!-- sales -->\n",
"<g id=\"node7\" class=\"node\">\n",
"<title>sales</title>\n",
"<ellipse fill=\"lightgrey\" stroke=\"black\" cx=\"206.42\" cy=\"-76.48\" rx=\"41.94\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"206.42\" y=\"-87.78\" font-family=\"Times,serif\" font-size=\"14.00\">sales</text>\n",
"<text text-anchor=\"middle\" x=\"206.42\" y=\"-72.78\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"206.42\" y=\"-57.78\" font-family=\"Times,serif\" font-size=\"14.00\">Normal</text>\n",
"</g>\n",
"<!-- σ&#45;&gt;sales -->\n",
"<g id=\"edge5\" class=\"edge\">\n",
"<title>σ&#45;&gt;sales</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M293.31,-156.37C277.69,-142.19 259,-125.22 242.97,-110.66\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"245.09,-107.86 235.34,-103.73 240.39,-113.05 245.09,-107.86\"/>\n",
"</g>\n",
"<!-- β_σ_hyperprior -->\n",
"<g id=\"node3\" class=\"node\">\n",
"<title>β_σ_hyperprior</title>\n",
"<ellipse fill=\"none\" stroke=\"black\" cx=\"338.42\" cy=\"-390.38\" rx=\"72.25\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"338.42\" y=\"-401.68\" font-family=\"Times,serif\" font-size=\"14.00\">β_σ_hyperprior</text>\n",
"<text text-anchor=\"middle\" x=\"338.42\" y=\"-386.68\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"338.42\" y=\"-371.68\" font-family=\"Times,serif\" font-size=\"14.00\">HalfNormal</text>\n",
"</g>\n",
"<!-- β_σ_hyperprior&#45;&gt;β -->\n",
"<g id=\"edge3\" class=\"edge\">\n",
"<title>β_σ_hyperprior&#45;&gt;β</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M297.49,-359.45C281.76,-347.95 263.75,-334.79 247.8,-323.13\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"249.81,-320.26 239.67,-317.18 245.68,-325.91 249.81,-320.26\"/>\n",
"</g>\n",
"<!-- μ -->\n",
"<g id=\"node6\" class=\"node\">\n",
"<title>μ</title>\n",
"<polygon fill=\"none\" stroke=\"black\" points=\"249.92,-213.93 158.92,-213.93 158.92,-160.93 249.92,-160.93 249.92,-213.93\"/>\n",
"<text text-anchor=\"middle\" x=\"204.42\" y=\"-198.73\" font-family=\"Times,serif\" font-size=\"14.00\">μ</text>\n",
"<text text-anchor=\"middle\" x=\"204.42\" y=\"-183.73\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"204.42\" y=\"-168.73\" font-family=\"Times,serif\" font-size=\"14.00\">Deterministic</text>\n",
"</g>\n",
"<!-- β&#45;&gt;μ -->\n",
"<g id=\"edge4\" class=\"edge\">\n",
"<title>β&#45;&gt;μ</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M204.42,-263.66C204.42,-251.68 204.42,-237.22 204.42,-224.19\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"207.92,-224.12 204.42,-214.12 200.92,-224.12 207.92,-224.12\"/>\n",
"</g>\n",
"<!-- β_offset -->\n",
"<g id=\"node5\" class=\"node\">\n",
"<title>β_offset</title>\n",
"<ellipse fill=\"none\" stroke=\"black\" cx=\"204.42\" cy=\"-390.38\" rx=\"43.68\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"204.42\" y=\"-401.68\" font-family=\"Times,serif\" font-size=\"14.00\">β_offset</text>\n",
"<text text-anchor=\"middle\" x=\"204.42\" y=\"-386.68\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"204.42\" y=\"-371.68\" font-family=\"Times,serif\" font-size=\"14.00\">Normal</text>\n",
"</g>\n",
"<!-- β_offset&#45;&gt;β -->\n",
"<g id=\"edge1\" class=\"edge\">\n",
"<title>β_offset&#45;&gt;β</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M204.42,-352.9C204.42,-344.48 204.42,-335.54 204.42,-327.16\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"207.92,-326.92 204.42,-316.92 200.92,-326.92 207.92,-326.92\"/>\n",
"</g>\n",
"<!-- μ&#45;&gt;sales -->\n",
"<g id=\"edge6\" class=\"edge\">\n",
"<title>μ&#45;&gt;sales</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M204.89,-160.89C205.09,-149.98 205.33,-136.89 205.56,-124.35\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"209.06,-124.06 205.75,-114 202.06,-123.94 209.06,-124.06\"/>\n",
"</g>\n",
"</g>\n",
"</svg>\n"
],
"text/plain": [
"<graphviz.dot.Digraph at 0x7f9ec3ac18b0>"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"pm.model_to_graphviz(model_hierarchical_salad_sales_predictions)"
]
},
{
"cell_type": "markdown",
"id": "modular-consolidation",
"metadata": {},
"source": [
"# Question 1\n",
"Is it an abuse of the API to generate posterior predictive samples for the group level and the location level by adding variables to the model after sampling?"
]
},
{
"cell_type": "code",
"execution_count": 8,
"id": "tired-smart",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
" <div>\n",
" <style>\n",
" /* Turns off some styling */\n",
" progress {\n",
" /* gets rid of default border in Firefox and Opera. */\n",
" border: none;\n",
" /* Needs to be in here for Safari polyfill so background images work as expected. */\n",
" background-size: auto;\n",
" }\n",
" .progress-bar-interrupted, .progress-bar-interrupted::-webkit-progress-bar {\n",
" background: #F44336;\n",
" }\n",
" </style>\n",
" <progress value='4000' class='' max='4000' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
" 100.00% [4000/4000 00:07<00:00]\n",
" </div>\n",
" "
],
"text/plain": [
"<IPython.core.display.HTML object>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Customer count for the hypothetical day we predict sales for\n",
"out_of_sample_customers = 50\n",
"\n",
"# Re-enter the already-sampled model and attach prediction nodes to it.\n",
"# NOTE(review): this mutates the existing model, so re-running the cell presumably\n",
"# requires rebuilding the model first; confirm.\n",
"with model_hierarchical_salad_sales_predictions:\n",
"    # Slope for an unseen location, drawn from the group-level distribution\n",
"    β_group = pm.Normal(\"group_beta_prediction\", β_μ_hyperprior, β_σ_hyperprior)\n",
"    group_level_prediction = pm.Normal(\n",
"        \"group_level_prediction\",\n",
"        β_group*out_of_sample_customers,\n",
"        σ,\n",
"    )\n",
"\n",
"    # Sales at the existing location with index 4, using its own slope β[4]\n",
"    location_4_prediction = pm.Normal(\n",
"        \"location_4_prediction\",\n",
"        β[4]*out_of_sample_customers,\n",
"        σ,\n",
"    )\n",
"\n",
"    # Only the two newly added nodes are requested\n",
"    ppc = pm.sample_posterior_predictive(\n",
"        trace_hierarchical_salad_sales_noncentered,\n",
"        var_names=['group_level_prediction', 'location_4_prediction'],\n",
"    )"
]
},
{
"cell_type": "code",
"execution_count": 9,
"id": "outer-level",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array(-11893.11106697)"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"model_hierarchical_salad_sales_predictions.logp(model_hierarchical_salad_sales_predictions.test_point)"
]
},
{
"cell_type": "markdown",
"id": "sporting-float",
"metadata": {},
"source": [
"# Question 2\n",
"Sampling is worse in this model when the extra nodes are included, even though they theoretically shouldn't contribute to the likelihood. Notably, the number of divergences increases dramatically. More broadly, do these results make sense?"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "acute-token",
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/sampling.py:465: FutureWarning: In an upcoming release, pm.sample will return an `arviz.InferenceData` object instead of a `MultiTrace` by default. You can pass return_inferencedata=True or return_inferencedata=False to be safe and silence this warning.\n",
" warnings.warn(\n",
"Auto-assigning NUTS sampler...\n",
"Initializing NUTS using jitter+adapt_diag...\n",
"Multiprocess sampling (4 chains in 4 jobs)\n",
"NUTS: [location_4_predictions, group_prediction, group_beta_prediction, β_offset, β_σ_hyperprior, β_μ_hyperprior, σ]\n"
]
},
{
"data": {
"text/html": [
"\n",
" <div>\n",
" <style>\n",
" /* Turns off some styling */\n",
" progress {\n",
" /* gets rid of default border in Firefox and Opera. */\n",
" border: none;\n",
" /* Needs to be in here for Safari polyfill so background images work as expected. */\n",
" background-size: auto;\n",
" }\n",
" .progress-bar-interrupted, .progress-bar-interrupted::-webkit-progress-bar {\n",
" background: #F44336;\n",
" }\n",
" </style>\n",
" <progress value='8000' class='' max='8000' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
" 100.00% [8000/8000 00:04<00:00 Sampling 4 chains, 1,008 divergences]\n",
" </div>\n",
" "
],
"text/plain": [
"<IPython.core.display.HTML object>"
]
},
"metadata": {},
"output_type": "display_data"
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"Sampling 4 chains for 1_000 tune and 1_000 draw iterations (4_000 + 4_000 draws total) took 5 seconds.\n",
"There were 149 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"There were 506 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"The acceptance probability does not match the target. It is 0.3882465788481101, but should be close to 0.8. Try to increase the number of tuning steps.\n",
"There were 175 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"There were 178 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"The rhat statistic is larger than 1.05 for some parameters. This indicates slight problems during sampling.\n",
"The estimated number of effective samples is smaller than 200 for some parameters.\n"
]
}
],
"source": [
"# If I used shared vars I get a shape error\n",
"# The customers column is wrapped in a theano shared variable for this model\n",
"customers = theano.shared(hierarchical_salad_df.loc[:, \"customers\"].values)\n",
"out_of_sample_customers = 50\n",
"\n",
"with pm.Model() as model_hierarchical_salad_sales_extra_nodes:\n",
"\n",
"    # Observation noise, shared by every location\n",
"    σ = pm.HalfNormal(\"σ\", 20)\n",
"\n",
"    # Group-level mean and spread of the per-location slopes\n",
"    β_μ_hyperprior = pm.Normal(\"β_μ_hyperprior\", 10, 10)\n",
"    β_σ_hyperprior = pm.HalfNormal(\"β_σ_hyperprior\", 10)\n",
"\n",
"    # Non-centered form; one offset per location category instead of a hard-coded count\n",
"    β_offset = pm.Normal('β_offset', mu=0, sd=1, shape=len(location_category.categories))\n",
"\n",
"    β = pm.Deterministic(\"β\", β_μ_hyperprior + β_offset * β_σ_hyperprior)\n",
"\n",
"    μ = pm.Deterministic('μ', β[location_category.codes] * customers)\n",
"\n",
"    sales = pm.Normal(\"sales\", mu=μ, sd=σ, observed=hierarchical_salad_df.sales)\n",
"\n",
"    # Extra nodes for group and individual level predictions.\n",
"    # They are unobserved, so they appear in the NUTS variable list in this cell's output.\n",
"    β_group = pm.Normal(\"group_beta_prediction\", β_μ_hyperprior, β_σ_hyperprior)\n",
"    group_prediction = pm.Normal(\"group_prediction\", β_group*out_of_sample_customers, σ)\n",
"    location_4_predictions = pm.Normal(\"location_4_predictions\", β[4]*out_of_sample_customers, σ)\n",
"\n",
"    # NOTE: this rebinds trace_hierarchical_salad_sales_noncentered, replacing the\n",
"    # trace sampled from model_hierarchical_salad_sales_predictions.\n",
"    # return_inferencedata=False keeps the MultiTrace return type and silences the FutureWarning.\n",
"    trace_hierarchical_salad_sales_noncentered = pm.sample(random_seed=0, return_inferencedata=False)\n"
]
},
{
"cell_type": "code",
"execution_count": 11,
"id": "rocky-mistress",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array(-11893.11106697)"
]
},
"execution_count": 11,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"model_hierarchical_salad_sales_extra_nodes.logp(model_hierarchical_salad_sales_extra_nodes.test_point)"
]
},
{
"cell_type": "code",
"execution_count": 15,
"id": "electric-concentrate",
"metadata": {},
"outputs": [
{
"data": {
"image/svg+xml": [
"<?xml version=\"1.0\" encoding=\"UTF-8\" standalone=\"no\"?>\n",
"<!DOCTYPE svg PUBLIC \"-//W3C//DTD SVG 1.1//EN\"\n",
" \"http://www.w3.org/Graphics/SVG/1.1/DTD/svg11.dtd\">\n",
"<!-- Generated by graphviz version 2.42.3 (20191010.1750)\n",
" -->\n",
"<!-- Title: %3 Pages: 1 -->\n",
"<svg width=\"611pt\" height=\"471pt\"\n",
" viewBox=\"0.00 0.00 611.29 470.81\" xmlns=\"http://www.w3.org/2000/svg\" xmlns:xlink=\"http://www.w3.org/1999/xlink\">\n",
"<g id=\"graph0\" class=\"graph\" transform=\"scale(1 1) rotate(0) translate(4 466.81)\">\n",
"<title>%3</title>\n",
"<polygon fill=\"white\" stroke=\"transparent\" points=\"-4,4 -4,-466.81 607.29,-466.81 607.29,4 -4,4\"/>\n",
"<g id=\"clust1\" class=\"cluster\">\n",
"<title>cluster6</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M353.29,-240.88C353.29,-240.88 437.29,-240.88 437.29,-240.88 443.29,-240.88 449.29,-246.88 449.29,-252.88 449.29,-252.88 449.29,-442.81 449.29,-442.81 449.29,-448.81 443.29,-454.81 437.29,-454.81 437.29,-454.81 353.29,-454.81 353.29,-454.81 347.29,-454.81 341.29,-448.81 341.29,-442.81 341.29,-442.81 341.29,-252.88 341.29,-252.88 341.29,-246.88 347.29,-240.88 353.29,-240.88\"/>\n",
"<text text-anchor=\"middle\" x=\"437.79\" y=\"-248.68\" font-family=\"Times,serif\" font-size=\"14.00\">6</text>\n",
"</g>\n",
"<g id=\"clust2\" class=\"cluster\">\n",
"<title>cluster41</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M499.29,-8C499.29,-8 583.29,-8 583.29,-8 589.29,-8 595.29,-14 595.29,-20 595.29,-20 595.29,-209.93 595.29,-209.93 595.29,-215.93 589.29,-221.93 583.29,-221.93 583.29,-221.93 499.29,-221.93 499.29,-221.93 493.29,-221.93 487.29,-215.93 487.29,-209.93 487.29,-209.93 487.29,-20 487.29,-20 487.29,-14 493.29,-8 499.29,-8\"/>\n",
"<text text-anchor=\"middle\" x=\"580.29\" y=\"-15.8\" font-family=\"Times,serif\" font-size=\"14.00\">41</text>\n",
"</g>\n",
"<!-- β_μ_hyperprior -->\n",
"<g id=\"node1\" class=\"node\">\n",
"<title>β_μ_hyperprior</title>\n",
"<ellipse fill=\"none\" stroke=\"black\" cx=\"262.29\" cy=\"-409.34\" rx=\"71.34\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"262.29\" y=\"-420.64\" font-family=\"Times,serif\" font-size=\"14.00\">β_μ_hyperprior</text>\n",
"<text text-anchor=\"middle\" x=\"262.29\" y=\"-405.64\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"262.29\" y=\"-390.64\" font-family=\"Times,serif\" font-size=\"14.00\">Normal</text>\n",
"</g>\n",
"<!-- group_beta_prediction -->\n",
"<g id=\"node4\" class=\"node\">\n",
"<title>group_beta_prediction</title>\n",
"<ellipse fill=\"none\" stroke=\"black\" cx=\"98.29\" cy=\"-298.38\" rx=\"98.08\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"98.29\" y=\"-309.68\" font-family=\"Times,serif\" font-size=\"14.00\">group_beta_prediction</text>\n",
"<text text-anchor=\"middle\" x=\"98.29\" y=\"-294.68\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"98.29\" y=\"-279.68\" font-family=\"Times,serif\" font-size=\"14.00\">Normal</text>\n",
"</g>\n",
"<!-- β_μ_hyperprior&#45;&gt;group_beta_prediction -->\n",
"<g id=\"edge7\" class=\"edge\">\n",
"<title>β_μ_hyperprior&#45;&gt;group_beta_prediction</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M218.77,-379.43C199.17,-366.4 175.78,-350.86 154.84,-336.95\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"156.61,-333.93 146.34,-331.31 152.74,-339.76 156.61,-333.93\"/>\n",
"</g>\n",
"<!-- β -->\n",
"<g id=\"node7\" class=\"node\">\n",
"<title>β</title>\n",
"<polygon fill=\"none\" stroke=\"black\" points=\"440.79,-324.88 349.79,-324.88 349.79,-271.88 440.79,-271.88 440.79,-324.88\"/>\n",
"<text text-anchor=\"middle\" x=\"395.29\" y=\"-309.68\" font-family=\"Times,serif\" font-size=\"14.00\">β</text>\n",
"<text text-anchor=\"middle\" x=\"395.29\" y=\"-294.68\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"395.29\" y=\"-279.68\" font-family=\"Times,serif\" font-size=\"14.00\">Deterministic</text>\n",
"</g>\n",
"<!-- β_μ_hyperprior&#45;&gt;β -->\n",
"<g id=\"edge1\" class=\"edge\">\n",
"<title>β_μ_hyperprior&#45;&gt;β</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M300.04,-377.41C317.49,-363.11 338.21,-346.14 355.86,-331.68\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"358.21,-334.28 363.73,-325.23 353.78,-328.86 358.21,-334.28\"/>\n",
"</g>\n",
"<!-- σ -->\n",
"<g id=\"node2\" class=\"node\">\n",
"<title>σ</title>\n",
"<ellipse fill=\"none\" stroke=\"black\" cx=\"273.29\" cy=\"-298.38\" rx=\"58.88\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"273.29\" y=\"-309.68\" font-family=\"Times,serif\" font-size=\"14.00\">σ</text>\n",
"<text text-anchor=\"middle\" x=\"273.29\" y=\"-294.68\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"273.29\" y=\"-279.68\" font-family=\"Times,serif\" font-size=\"14.00\">HalfNormal</text>\n",
"</g>\n",
"<!-- group_prediction -->\n",
"<g id=\"node3\" class=\"node\">\n",
"<title>group_prediction</title>\n",
"<ellipse fill=\"none\" stroke=\"black\" cx=\"114.29\" cy=\"-187.43\" rx=\"77.56\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"114.29\" y=\"-198.73\" font-family=\"Times,serif\" font-size=\"14.00\">group_prediction</text>\n",
"<text text-anchor=\"middle\" x=\"114.29\" y=\"-183.73\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"114.29\" y=\"-168.73\" font-family=\"Times,serif\" font-size=\"14.00\">Normal</text>\n",
"</g>\n",
"<!-- σ&#45;&gt;group_prediction -->\n",
"<g id=\"edge9\" class=\"edge\">\n",
"<title>σ&#45;&gt;group_prediction</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M239.59,-267.46C228.92,-258.52 216.88,-248.95 205.29,-240.88 195.47,-234.05 184.7,-227.27 174.12,-220.97\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"175.7,-217.83 165.3,-215.8 172.16,-223.87 175.7,-217.83\"/>\n",
"</g>\n",
"<!-- location_4_predictions -->\n",
"<g id=\"node6\" class=\"node\">\n",
"<title>location_4_predictions</title>\n",
"<ellipse fill=\"none\" stroke=\"black\" cx=\"379.29\" cy=\"-187.43\" rx=\"98.99\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"379.29\" y=\"-198.73\" font-family=\"Times,serif\" font-size=\"14.00\">location_4_predictions</text>\n",
"<text text-anchor=\"middle\" x=\"379.29\" y=\"-183.73\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"379.29\" y=\"-168.73\" font-family=\"Times,serif\" font-size=\"14.00\">Normal</text>\n",
"</g>\n",
"<!-- σ&#45;&gt;location_4_predictions -->\n",
"<g id=\"edge12\" class=\"edge\">\n",
"<title>σ&#45;&gt;location_4_predictions</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M303.66,-266.16C314.5,-255.02 326.9,-242.28 338.48,-230.38\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"341.09,-232.71 345.56,-223.1 336.08,-227.83 341.09,-232.71\"/>\n",
"</g>\n",
"<!-- sales -->\n",
"<g id=\"node10\" class=\"node\">\n",
"<title>sales</title>\n",
"<ellipse fill=\"lightgrey\" stroke=\"black\" cx=\"539.29\" cy=\"-76.48\" rx=\"41.94\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"539.29\" y=\"-87.78\" font-family=\"Times,serif\" font-size=\"14.00\">sales</text>\n",
"<text text-anchor=\"middle\" x=\"539.29\" y=\"-72.78\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"539.29\" y=\"-57.78\" font-family=\"Times,serif\" font-size=\"14.00\">Normal</text>\n",
"</g>\n",
"<!-- σ&#45;&gt;sales -->\n",
"<g id=\"edge5\" class=\"edge\">\n",
"<title>σ&#45;&gt;sales</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M261.42,-261.67C253.03,-229.17 247.09,-181.56 271.29,-149.95 297.47,-115.75 417.7,-93.98 487.91,-83.95\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"488.47,-87.41 497.89,-82.56 487.5,-80.48 488.47,-87.41\"/>\n",
"</g>\n",
"<!-- group_beta_prediction&#45;&gt;group_prediction -->\n",
"<g id=\"edge10\" class=\"edge\">\n",
"<title>group_beta_prediction&#45;&gt;group_prediction</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M103.66,-260.8C104.87,-252.54 106.18,-243.65 107.44,-235.04\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"110.91,-235.5 108.9,-225.1 103.99,-234.49 110.91,-235.5\"/>\n",
"</g>\n",
"<!-- β_σ_hyperprior -->\n",
"<g id=\"node5\" class=\"node\">\n",
"<title>β_σ_hyperprior</title>\n",
"<ellipse fill=\"none\" stroke=\"black\" cx=\"99.29\" cy=\"-409.34\" rx=\"72.25\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"99.29\" y=\"-420.64\" font-family=\"Times,serif\" font-size=\"14.00\">β_σ_hyperprior</text>\n",
"<text text-anchor=\"middle\" x=\"99.29\" y=\"-405.64\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"99.29\" y=\"-390.64\" font-family=\"Times,serif\" font-size=\"14.00\">HalfNormal</text>\n",
"</g>\n",
"<!-- β_σ_hyperprior&#45;&gt;group_beta_prediction -->\n",
"<g id=\"edge8\" class=\"edge\">\n",
"<title>β_σ_hyperprior&#45;&gt;group_beta_prediction</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M98.95,-371.75C98.88,-363.58 98.8,-354.8 98.72,-346.27\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"102.22,-346.02 98.62,-336.06 95.22,-346.09 102.22,-346.02\"/>\n",
"</g>\n",
"<!-- β_σ_hyperprior&#45;&gt;β -->\n",
"<g id=\"edge3\" class=\"edge\">\n",
"<title>β_σ_hyperprior&#45;&gt;β</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M151.83,-383.45C161.81,-379.23 172.27,-375.16 182.29,-371.86 251.1,-349.18 274.79,-364.63 341.29,-335.86 345.14,-334.19 349.01,-332.24 352.82,-330.12\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"354.73,-333.06 361.53,-324.94 351.15,-327.05 354.73,-333.06\"/>\n",
"</g>\n",
"<!-- β&#45;&gt;location_4_predictions -->\n",
"<g id=\"edge11\" class=\"edge\">\n",
"<title>β&#45;&gt;location_4_predictions</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M391.54,-271.84C389.92,-260.82 387.97,-247.58 386.12,-234.92\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"389.57,-234.34 384.65,-224.95 382.64,-235.36 389.57,-234.34\"/>\n",
"</g>\n",
"<!-- μ -->\n",
"<g id=\"node9\" class=\"node\">\n",
"<title>μ</title>\n",
"<polygon fill=\"none\" stroke=\"black\" points=\"586.79,-213.93 495.79,-213.93 495.79,-160.93 586.79,-160.93 586.79,-213.93\"/>\n",
"<text text-anchor=\"middle\" x=\"541.29\" y=\"-198.73\" font-family=\"Times,serif\" font-size=\"14.00\">μ</text>\n",
"<text text-anchor=\"middle\" x=\"541.29\" y=\"-183.73\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"541.29\" y=\"-168.73\" font-family=\"Times,serif\" font-size=\"14.00\">Deterministic</text>\n",
"</g>\n",
"<!-- β&#45;&gt;μ -->\n",
"<g id=\"edge4\" class=\"edge\">\n",
"<title>β&#45;&gt;μ</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M429.52,-271.84C450.22,-256.39 476.78,-236.57 498.82,-220.12\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"501.1,-222.79 507.02,-214 496.91,-217.18 501.1,-222.79\"/>\n",
"</g>\n",
"<!-- β_offset -->\n",
"<g id=\"node8\" class=\"node\">\n",
"<title>β_offset</title>\n",
"<ellipse fill=\"none\" stroke=\"black\" cx=\"395.29\" cy=\"-409.34\" rx=\"43.68\" ry=\"37.45\"/>\n",
"<text text-anchor=\"middle\" x=\"395.29\" y=\"-420.64\" font-family=\"Times,serif\" font-size=\"14.00\">β_offset</text>\n",
"<text text-anchor=\"middle\" x=\"395.29\" y=\"-405.64\" font-family=\"Times,serif\" font-size=\"14.00\">~</text>\n",
"<text text-anchor=\"middle\" x=\"395.29\" y=\"-390.64\" font-family=\"Times,serif\" font-size=\"14.00\">Normal</text>\n",
"</g>\n",
"<!-- β_offset&#45;&gt;β -->\n",
"<g id=\"edge2\" class=\"edge\">\n",
"<title>β_offset&#45;&gt;β</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M395.29,-371.75C395.29,-360.02 395.29,-347.03 395.29,-335.34\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"398.79,-335.04 395.29,-325.04 391.79,-335.04 398.79,-335.04\"/>\n",
"</g>\n",
"<!-- μ&#45;&gt;sales -->\n",
"<g id=\"edge6\" class=\"edge\">\n",
"<title>μ&#45;&gt;sales</title>\n",
"<path fill=\"none\" stroke=\"black\" d=\"M540.82,-160.89C540.62,-149.98 540.38,-136.89 540.15,-124.35\"/>\n",
"<polygon fill=\"black\" stroke=\"black\" points=\"543.64,-123.94 539.96,-114 536.64,-124.06 543.64,-123.94\"/>\n",
"</g>\n",
"</g>\n",
"</svg>\n"
],
"text/plain": [
"<graphviz.dot.Digraph at 0x7f9ebd6f7b80>"
]
},
"execution_count": 15,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Draw the dependency graph of the model that carries the extra prediction nodes\n",
"pm.model_to_graphviz(model=model_hierarchical_salad_sales_extra_nodes)"
]
},
{
"cell_type": "markdown",
"id": "flying-volunteer",
"metadata": {},
"source": [
"# The actual right way to do it\n",
"I know this is the right way; I'm only asking about the other two approaches above."
]
},
{
"cell_type": "code",
"execution_count": 16,
"id": "disturbed-works",
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/sampling.py:465: FutureWarning: In an upcoming release, pm.sample will return an `arviz.InferenceData` object instead of a `MultiTrace` by default. You can pass return_inferencedata=True or return_inferencedata=False to be safe and silence this warning.\n",
" warnings.warn(\n",
"Auto-assigning NUTS sampler...\n",
"Initializing NUTS using jitter+adapt_diag...\n",
"Multiprocess sampling (4 chains in 4 jobs)\n",
"NUTS: [β_offset, β_σ_hyperprior, β_μ_hyperprior, σ]\n"
]
},
{
"data": {
"text/html": [
"\n",
" <div>\n",
" <style>\n",
" /* Turns off some styling */\n",
" progress {\n",
" /* gets rid of default border in Firefox and Opera. */\n",
" border: none;\n",
" /* Needs to be in here for Safari polyfill so background images work as expected. */\n",
" background-size: auto;\n",
" }\n",
" .progress-bar-interrupted, .progress-bar-interrupted::-webkit-progress-bar {\n",
" background: #F44336;\n",
" }\n",
" </style>\n",
" <progress value='8000' class='' max='8000' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
" 100.00% [8000/8000 00:03<00:00 Sampling 4 chains, 81 divergences]\n",
" </div>\n",
" "
],
"text/plain": [
"<IPython.core.display.HTML object>"
]
},
"metadata": {},
"output_type": "display_data"
},
{
"name": "stderr",
"output_type": "stream",
"text": [
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"/home/canyon/miniconda3/envs/cargo/lib/python3.9/site-packages/pymc3/math.py:246: RuntimeWarning: divide by zero encountered in log1p\n",
" return np.where(x < 0.6931471805599453, np.log(-np.expm1(-x)), np.log1p(-np.exp(-x)))\n",
"Sampling 4 chains for 1_000 tune and 1_000 draw iterations (4_000 + 4_000 draws total) took 3 seconds.\n",
"There were 17 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"There were 10 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"There were 27 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"There were 27 divergences after tuning. Increase `target_accept` or reparameterize.\n",
"The number of effective samples is smaller than 25% for some parameters.\n"
]
}
],
"source": [
"# Wrap the observed customer counts in a Theano shared variable so the values\n",
"# can be replaced after sampling (for posterior predictive sampling).\n",
"# μ multiplies `customers` elementwise with β[location_category.codes], so any\n",
"# replacement needs the same length as the observed data; otherwise the\n",
"# multiplication fails with a shape error.\n",
"customers_observed = hierarchical_salad_df[\"customers\"].to_numpy()\n",
"customers = theano.shared(customers_observed)\n",
"\n",
"with pm.Model() as model_hierarchical_salad_sales_extra_nodes:\n",
"    # Noise scale of the sales likelihood\n",
"    σ = pm.HalfNormal(\"σ\", 20)\n",
"\n",
"    # Group-level hyperpriors for the slopes\n",
"    β_μ_hyperprior = pm.Normal(\"β_μ_hyperprior\", 10, 10)\n",
"    β_σ_hyperprior = pm.HalfNormal(\"β_σ_hyperprior\", 10)\n",
"\n",
"    # Non-centered parameterization: standard-normal offsets that are shifted\n",
"    # and scaled by the hyperpriors to form the slopes\n",
"    β_offset = pm.Normal(\"β_offset\", mu=0, sd=1, shape=6)\n",
"    β = pm.Deterministic(\"β\", β_μ_hyperprior + β_offset * β_σ_hyperprior)\n",
"\n",
"    # Expected sales: the slope selected by each row's location code times\n",
"    # that row's customer count\n",
"    μ = pm.Deterministic(\"μ\", β[location_category.codes] * customers)\n",
"\n",
"    sales = pm.Normal(\"sales\", mu=μ, sd=σ, observed=hierarchical_salad_df.sales)\n",
"\n",
"    # return_inferencedata is passed explicitly: it keeps the MultiTrace return\n",
"    # type and silences the FutureWarning about the upcoming default change\n",
"    trace_hierarchical_salad_sales_noncentered = pm.sample(\n",
"        random_seed=0, return_inferencedata=False\n",
"    )\n"
]
},
{
"cell_type": "code",
"execution_count": 22,
"id": "impaired-bleeding",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"\n",
" <div>\n",
" <style>\n",
" /* Turns off some styling */\n",
" progress {\n",
" /* gets rid of default border in Firefox and Opera. */\n",
" border: none;\n",
" /* Needs to be in here for Safari polyfill so background images work as expected. */\n",
" background-size: auto;\n",
" }\n",
" .progress-bar-interrupted, .progress-bar-interrupted::-webkit-progress-bar {\n",
" background: #F44336;\n",
" }\n",
" </style>\n",
" <progress value='4000' class='' max='4000' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
" 100.00% [4000/4000 00:00<00:00]\n",
" </div>\n",
" "
],
"text/plain": [
"<IPython.core.display.HTML object>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"# Predict sales for 50 customers at every observed row's location. The new\n",
"# values keep the shared variable's original shape and dtype so they still line\n",
"# up with the location index used inside μ.\n",
"customers.set_value(np.full_like(customers.get_value(), 50))\n",
"\n",
"# Re-enter the fitted model instead of opening a fresh pm.Model(): a new, empty\n",
"# model has no observed variables, so nothing would be predicted from it.\n",
"with model_hierarchical_salad_sales_extra_nodes:\n",
"    ppc = pm.sample_posterior_predictive(trace_hierarchical_salad_sales_noncentered)"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.9.1"
}
},
"nbformat": 4,
"nbformat_minor": 5
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment