Commit

Update week 3 materials
teddygroves committed Mar 18, 2024
1 parent c6e9abd commit 0f758a9
Showing 11 changed files with 807 additions and 320 deletions.
104 changes: 83 additions & 21 deletions docs/index.html

Large diffs are not rendered by default.

144 changes: 103 additions & 41 deletions docs/metropolis-hastings.html

Large diffs are not rendered by default.

183 changes: 97 additions & 86 deletions docs/search.json

Large diffs are not rendered by default.

2 changes: 1 addition & 1 deletion docs/site_libs/bootstrap/bootstrap.min.css

Large diffs are not rendered by default.

1 change: 1 addition & 0 deletions docs/site_libs/quarto-nav/quarto-nav.js
@@ -237,6 +237,7 @@ window.document.addEventListener("DOMContentLoaded", function () {
const links = window.document.querySelectorAll("a");
for (let i = 0; i < links.length; i++) {
if (links[i].href) {
links[i].dataset.originalHref = links[i].href;
links[i].href = links[i].href.replace(/\/index\.html/, "/");
}
}
65 changes: 52 additions & 13 deletions docs/site_libs/quarto-search/quarto-search.js
@@ -675,6 +675,18 @@ function showCopyLink(query, options) {
// create the index
var fuseIndex = undefined;
var shownWarning = false;

// fuse index options
const kFuseIndexOptions = {
keys: [
{ name: "title", weight: 20 },
{ name: "section", weight: 20 },
{ name: "text", weight: 10 },
],
ignoreLocation: true,
threshold: 0.1,
};

async function readSearchData() {
// Initialize the search index on demand
if (fuseIndex === undefined) {
@@ -685,17 +697,7 @@ async function readSearchData() {
shownWarning = true;
return;
}
// create fuse index
const options = {
keys: [
{ name: "title", weight: 20 },
{ name: "section", weight: 20 },
{ name: "text", weight: 10 },
],
ignoreLocation: true,
threshold: 0.1,
};
const fuse = new window.Fuse([], options);
const fuse = new window.Fuse([], kFuseIndexOptions);

// fetch the main search.json
const response = await fetch(offsetURL("search.json"));
@@ -1226,8 +1228,34 @@ function algoliaSearch(query, limit, algoliaOptions) {
});
}

function fuseSearch(query, fuse, fuseOptions) {
return fuse.search(query, fuseOptions).map((result) => {
let subSearchTerm = undefined;
let subSearchFuse = undefined;
const kFuseMaxWait = 125;

async function fuseSearch(query, fuse, fuseOptions) {
let index = fuse;
// Fuse.js uses the Bitap algorithm for text matching, which runs in
// O(nm) time (no matter the structure of the text). In our case this
// means that long search terms mixed with a large index get very slow.
//
// This injects a subIndex that will be used once the terms get long enough.
// Usually making this subindex is cheap since there will typically be
// a subset of results matching the existing query
if (subSearchFuse !== undefined && query.startsWith(subSearchTerm)) {
// Use the existing subSearchFuse
index = subSearchFuse;
} else if (subSearchFuse !== undefined) {
// The term changed, discard the existing fuse
subSearchFuse = undefined;
subSearchTerm = undefined;
}

// Search using the active fuse
const then = performance.now();
const resultsRaw = await index.search(query, fuseOptions);
const now = performance.now();

const results = resultsRaw.map((result) => {
const addParam = (url, name, value) => {
const anchorParts = url.split("#");
const baseUrl = anchorParts[0];
@@ -1244,4 +1272,15 @@ function fuseSearch(query, fuse, fuseOptions) {
crumbs: result.item.crumbs,
};
});

// If we don't have a subfuse and the query took long enough, go ahead
// and create a subfuse to use for subsequent queries
if (now - then > kFuseMaxWait && subSearchFuse === undefined) {
subSearchTerm = query;
subSearchFuse = new window.Fuse([], kFuseIndexOptions);
resultsRaw.forEach((rr) => {
subSearchFuse.add(rr.item);
});
}
return results;
}
104 changes: 83 additions & 21 deletions docs/week1.html

Large diffs are not rendered by default.

108 changes: 85 additions & 23 deletions docs/week2.html

Large diffs are not rendered by default.

321 changes: 220 additions & 101 deletions docs/week3.html

Large diffs are not rendered by default.

4 changes: 2 additions & 2 deletions materials/_quarto.yml
@@ -11,8 +11,8 @@ project:
- index.md
- week1.md
- week2.md
- week3.qmd
- metropolis-hastings.qmd
- week3.qmd

website:
title: "Bayesian Statistics for Computational Biology"
@@ -31,8 +31,8 @@ website:
contents:
- week1.md
- week2.md
- week3.qmd
- metropolis-hastings.qmd
- week3.qmd

format:
html:
91 changes: 80 additions & 11 deletions materials/week3.qmd
@@ -3,7 +3,6 @@
Plan for today:

- After MCMC: [diagnostics](#mcmc-diagnostics), [model evaluation](#model-evaluation), [results](#Results)
- Code your own Metropolis-Hastings sampler

Recap from last week:

@@ -48,7 +47,28 @@ Find out more:

# Model evaluation

## Very quick decision theory
## Retrospective 'predictive' checks

**Predictive distribution**: the distribution a model that can replicate its
measurements assigns to those replicated measurements, i.e. $p(y^{rep})$.
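
For a concrete picture, here is a minimal sketch of drawing replicated
measurements, assuming a hypothetical model where $\mu \sim N(0, 2)$ a priori
and $y \sim N(\mu, 1)$ (this toy model is not part of the radon example used
below):

```python
import numpy as np

rng = np.random.default_rng(0)
n_rep = 1000

# hypothetical prior: mu ~ Normal(0, 2)
mu_draws = rng.normal(0.0, 2.0, size=n_rep)

# hypothetical measurement model: y ~ Normal(mu, 1), so prior predictive
# draws come from pushing the prior draws through the likelihood
y_rep = rng.normal(mu_draws, 1.0)

# swapping in posterior draws of mu instead would give posterior
# predictive draws
```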

It's very useful to check these things:

- The prior predictive distribution should not allocate much probability mass to
replicated measurements that are obviously impossible.

- If any actual measurements lie in a region with low prior predictive
probability (e.g. if measurement $i$ is so low that $p(y^{rep}_i > y_i) =
0.99$), that shows that the prior model is inconsistent with the measurements.

- If there are systematic differences between the posterior predictive
distribution and the observed measurements, that is a sign that the model is
inconsistent with the measurements.

Since predictive checking depends on pattern-matching, it is often a good idea
to use graphs for it.
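
For example, arviz can draw these comparisons directly. A minimal sketch,
assuming an `InferenceData` object `idata` whose `prior_predictive`,
`posterior_predictive` and `observed_data` groups all contain a variable
called `"y"`:

```python
import arviz as az

# prior predictive check: most observations should not sit in the far
# tails of the replicated measurements
az.plot_ppc(idata, group="prior", var_names=["y"])

# posterior predictive check: systematic mismatches here suggest the
# model is inconsistent with the measurements
az.plot_ppc(idata, group="posterior", var_names=["y"])
```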

## Scoring models with loss functions

**Loss function**: If the observation is $y$ and the model says $p(y) = z$, how
bad is that?
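
For example, the logarithmic loss $-\log p(y)$ penalises a model heavily for
assigning low probability density to what was actually observed. A minimal
sketch, assuming a hypothetical observation `y_obs` and a model whose
predictive distribution is normal with mean `mu` and standard deviation
`sigma` (scipy assumed to be available):

```python
import numpy as np
from scipy.stats import norm

y_obs = 3.1            # hypothetical observation
mu, sigma = 2.0, 1.0   # hypothetical predictive distribution

z = norm(mu, sigma).pdf(y_obs)  # p(y) = z, the density the model gives y_obs
log_loss = -np.log(z)           # smaller is better; blows up as z -> 0
print(log_loss)
```
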
@@ -89,7 +109,6 @@ Out of sample log likelihood can often be approximated cheaply: see

Find out more: [@landesObjectiveBayesianismMaximum2013, section 2.3]


# Results

Some useful summary statistics:
@@ -100,26 +119,51 @@
Mean | "What does the model think is the most likely value?"
Standard deviation | "How sure is my model about this?"
Quantile n | "What is x s.t. my model is n% sure that the quantity is at most x?"
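
All of these can be computed directly from MCMC draws. A minimal sketch using
numpy, with a hypothetical array `draws` standing in for real samples of a
single quantity:

```python
import numpy as np

rng = np.random.default_rng(1234)
draws = rng.normal(1.0, 0.5, size=4000)  # stand-in for real MCMC draws

print(draws.mean())             # mean
print(draws.std())              # standard deviation
print(np.quantile(draws, 0.1))  # 10% quantile: the model is 10% sure the
                                # quantity is at most this value
```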

Do I have enough samples? To find out, calculate the [Monte Carlo Standard Error](https://mc-stan.org/docs/reference-manual/effective-sample-size.html#estimation-of-mcmc-standard-error).
Do I have enough samples? To find out, calculate the [Monte Carlo standard error](https://mc-stan.org/docs/reference-manual/effective-sample-size.html#estimation-of-mcmc-standard-error).

:::{.callout-important}
MCSE can vary for different statistics relating to the same quantity
Monte Carlo standard error can vary for different statistics relating to the same quantity
:::
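
For instance, arviz's `mcse` function computes this. A minimal sketch, assuming
an `InferenceData` object `idata` whose `posterior` group contains a variable
called `sigma`:

```python
import arviz as az

# Monte Carlo standard error of the posterior mean of sigma
print(az.mcse(idata.posterior, var_names=["sigma"], method="mean"))

# the 5% quantile of the same quantity can have a different Monte Carlo
# standard error, as the callout above warns
print(az.mcse(idata.posterior, var_names=["sigma"], method="quantile", prob=0.05))
```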

# Example

We'll go through some diagnostics using [arviz](https://python.arviz.org).

Step one is to load some data. Rather than going through a whole modelling
workflow, we'll just take one of the example MCMC outputs that arviz provides
via the function
[`load_arviz_data`](https://python.arviz.org/en/stable/api/generated/arviz.load_arviz_data.html).

This particular MCMC output has to do with measurements of radon radioactivity
in houses in the US state of Minnesota. You can read more about it [here](https://docs.pymc.io/notebooks/multilevel_modeling.html).

```{python}
import arviz as az
import numpy as np
import xarray as xr
import numpy as np # numpy is for numerical programming
import xarray as xr # xarray is for manipulating n dimensional tables; arviz uses it a lot!
idata = az.load_arviz_data("radon")
idata
```

The function `az.summary` lets us look at some useful summary statistics,
Arviz provides a data structure called
[`InferenceData`](https://python.arviz.org/en/latest/api/inference_data.html)
which it uses for storing MCMC outputs. It's worth getting to know it: there is
some helpful explanation [here](https://python.arviz.org/en/latest/schema/schema.html).

At a high level, an `InferenceData` is a container for several xarray
`Dataset` objects called 'groups'. Each group contains xarray
[`DataArray`](https://docs.xarray.dev/en/stable/generated/xarray.DataArray.html)
objects called 'variables'. Each variable contains a rectangular array of
values, plus the shape of the values ('dimensions') and labels for the
dimensions ('coordinates').

For example, if you click on the dropdown arrows above you will see that
the group `posterior` contains a variable called `a_county` that has three
dimensions called `chain`, `draw` and `County`. There are 85 counties and the
first one is labelled `'AITKIN'`.
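
The same information can be pulled out programmatically with xarray's indexing
methods. A short sketch using the `idata` object loaded above:

```python
posterior = idata.posterior              # one 'group': an xarray Dataset
a_county = posterior["a_county"]         # one 'variable': an xarray DataArray

print(a_county.dims)                     # ('chain', 'draw', 'County')
print(a_county.coords["County"].values[:3])  # labels of the first few counties

# select all draws for a single county by its label
aitkin_draws = a_county.sel(County="AITKIN")
print(aitkin_draws.shape)                # (number of chains, number of draws)
```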

The function [`az.summary`](https://python.arviz.org/en/latest/api/generated/arviz.summary.html) lets us look at some useful summary statistics,
including $\hat{R}$, divergent transitions and MCSE.

The variable `lp`, which you can find in the group `sample_stats`, is the
@@ -139,10 +183,29 @@ this case the group is called `posterior`.
az.summary(idata.posterior, var_names=["sigma", "g"])
```

In this case there were no post-warmup divergent transitions, and the $\hat{R}$
statistic for the `lp` variable is pretty close to 1: great!

Now we can start evaluating the model. First we check to see whether replicated
measurements from the model's posterior predictive distribution broadly agree
with the observed measurements, using the arviz function [`plot_lm`](https://python.arviz.org/en/latest/api/generated/arviz.plot_lm.html#arviz.plot_lm):

```{python}
az.style.use("arviz-doc")
az.plot_lm(
    y=idata.observed_data["y"],
    x=idata.observed_data["obs_id"],
    y_hat=idata.posterior_predictive["y"],
    figsize=[12, 5],
    grid=False
);
```

The function `az.loo` performs approximate leave-one-out cross validation, which
can be useful for evaluating how well the model might make predictions. Watch
out for the `warning` column, which can tell you if the approximation is likely
to be incorrect.
to be incorrect. It's usually a good idea to set the `pointwise` argument to
`True`, as this allows for more detailed analysis at the per-observation level.

```{python}
az.loo(idata, var_name="y", pointwise=True)
@@ -159,13 +222,19 @@ idata.log_likelihood["fake"] = xr.DataArray(
    coords=idata.log_likelihood.coords,
    dims=idata.log_likelihood.dims
)
az.compare(
comparison = az.compare(
    {
        "real": az.loo(idata, var_name="y"),
        "fake": az.loo(idata, var_name="fake")
    }
)
comparison
```

az.plot_ppc(j)
The function [`az.plot_compare`](https://python.arviz.org/en/latest/api/generated/arviz.plot_compare.html) shows these results on a nice graph:

```{python}
az.plot_compare(comparison);
```
