diff --git a/GP.qmd b/GP.qmd
index 61e6d25..2dc8dea 100644
--- a/GP.qmd
+++ b/GP.qmd
@@ -1,6 +1,6 @@
---
-title: "VectorByte Methods Training"
-subtitle: "Introduction to Gaussian Processes for Time Dependent Data"
+subtitle: "VectorByte Methods Training"
+title: "Introduction to Gaussian Processes for Time Dependent Data"
editor: source
author: "The VectorByte Team (Parul Patil, Virginia Tech)"
title-slide-attributes:
diff --git a/GP_Notes.qmd b/GP_Notes.qmd
index b8f393b..aeb1ce7 100644
--- a/GP_Notes.qmd
+++ b/GP_Notes.qmd
@@ -1,11 +1,15 @@
---
-title: "VectorByte Methods Training"
-subtitle: "Introduction to Gaussian Processes for Time Dependent Data"
-author: "The VectorByte Team (Parul Patil, Virginia Tech)"
+title: "VectorByte Methods Training: Introduction to Gaussian Processes for Time Dependent Data (notes)"
+author:
+ - name: Parul Patil
+ affiliation: Virginia Tech and VectorByte
title-slide-attributes:
data-background-image: VectorByte-logo_lg.png
data-background-size: contain
data-background-opacity: "0.2"
+citation: true
+date: 2024-07-21
+date-format: long
format:
html:
toc: true
diff --git a/GP_Practical.qmd b/GP_Practical.qmd
index d7f70ba..23bf0f2 100644
--- a/GP_Practical.qmd
+++ b/GP_Practical.qmd
@@ -1,7 +1,11 @@
---
-title: "VectorByte Methods Training"
-subtitle: "Practical: Introduction to Gaussian Processes for Time Dependent Data"
-author: "The VectorByte Team (Parul Patil, Virginia Tech)"
+title: "VectorByte Methods Training: Introduction to Gaussian Processes for Time Dependent Data (Practical)"
+author:
+ - name: Parul Patil
+ affiliation: Virginia Tech and VectorByte
+citation: true
+date: 2024-07-21
+date-format: long
format:
html:
toc: true
diff --git a/Stats_review.qmd b/Stats_review.qmd
index 2e736e0..c863679 100644
--- a/Stats_review.qmd
+++ b/Stats_review.qmd
@@ -1,7 +1,12 @@
---
-title: VectorByte Methods Training
-subtitle: Probability and Statistics Fundamentals
-author: The VectorByte Team (Leah R. Johnson, Virginia Tech)
+title: "VectorByte Methods Training: Probability and Statistics Fundamentals"
+author:
+ - name: Leah R. Johnson
+ url: https://lrjohnson0.github.io/QEDLab/leahJ.html
+ affiliation: Virginia Tech and VectorByte
+citation: true
+date: 2024-07-01
+date-format: long
format:
html:
toc: true
diff --git a/VB_RegDiagTrans.qmd b/VB_RegDiagTrans.qmd
index ef1b52a..84ebd00 100644
--- a/VB_RegDiagTrans.qmd
+++ b/VB_RegDiagTrans.qmd
@@ -1,6 +1,6 @@
---
-title: "VectorByte Methods Training"
-subtitle: "Review of Diagnostics and Transformations for Regression Models"
+subtitle: "VectorByte Methods Training"
+title: "Review of Diagnostics and Transformations for Regression Models"
author: "The VectorByte Team (Leah R. Johnson, Virginia Tech)"
title-slide-attributes:
data-background-image: VectorByte-logo_lg.png
diff --git a/VB_RegDiagTrans_practical.qmd b/VB_RegDiagTrans_practical.qmd
index ffd5687..1a64b10 100644
--- a/VB_RegDiagTrans_practical.qmd
+++ b/VB_RegDiagTrans_practical.qmd
@@ -1,7 +1,12 @@
---
-title: "VectorByte Methods Training"
-subtitle: "Practical: Diagnostics and Transformations"
-author: "The VectorByte Team (Leah R. Johnson, Virginia Tech)"
+title: "VectorByte Methods Training: Regression Diagnostics and Transformations (practical)"
+author:
+ - name: Leah R. Johnson
+ url: https://lrjohnson0.github.io/QEDLab/leahJ.html
+ affiliation: Virginia Tech and VectorByte
+citation: true
+date: 2024-07-01
+date-format: long
format:
html:
toc: true
diff --git a/VB_RegRev.qmd b/VB_RegRev.qmd
index d73a8b4..628eb2f 100644
--- a/VB_RegRev.qmd
+++ b/VB_RegRev.qmd
@@ -1,11 +1,12 @@
---
-title: "VectorByte Methods Training"
-subtitle: "Regression Review"
-author: "The VectorByte Team (Leah R. Johnson, Virginia Tech)"
-title-slide-attributes:
- data-background-image: VectorByte-logo_lg.png
- data-background-size: contain
- data-background-opacity: "0.2"
+title: "VectorByte Methods Training: Regression Review"
+author:
+ - name: Leah R. Johnson
+ url: https://lrjohnson0.github.io/QEDLab/leahJ.html
+ affiliation: Virginia Tech and VectorByte
+citation: true
+date: 2024-07-01
+date-format: long
format:
html:
toc: true
diff --git a/VB_TimeDepData.qmd b/VB_TimeDepData.qmd
index dd96516..5f75af3 100644
--- a/VB_TimeDepData.qmd
+++ b/VB_TimeDepData.qmd
@@ -1,6 +1,6 @@
---
-title: "VectorByte Methods Training"
-subtitle: "Regression Methods for Time Dependent Data"
+subtitle: "VectorByte Methods Training"
+title: "Regression Methods for Time Dependent Data"
author: "The VectorByte Team (Leah R. Johnson, Virginia Tech)"
title-slide-attributes:
data-background-image: VectorByte-logo_lg.png
diff --git a/VB_TimeDepData_practical.qmd b/VB_TimeDepData_practical.qmd
index 7c56f31..8761f32 100644
--- a/VB_TimeDepData_practical.qmd
+++ b/VB_TimeDepData_practical.qmd
@@ -1,7 +1,12 @@
---
-title: "VectorByte Methods Training"
-subtitle: "Practical: Intro to Time Dependent Data"
-author: "The VectorByte Team (Leah R. Johnson, Virginia Tech)"
+title: "VectorByte Methods Training: Regression Methods for Time Dependent Data (practical)"
+author:
+ - name: Leah R. Johnson
+ url: https://lrjohnson0.github.io/QEDLab/leahJ.html
+ affiliation: Virginia Tech and VectorByte
+citation: true
+date: 2024-07-01
+date-format: long
format:
html:
toc: true
diff --git a/docs/Stats_review.html b/docs/Stats_review.html
index c986886..3c78bc3 100644
--- a/docs/Stats_review.html
+++ b/docs/Stats_review.html
@@ -6,9 +6,10 @@
-VectorByte Training 2024 - VectorByte Methods Training
+VectorByte Training 2024 - VectorByte Methods Training: Probability and Statistics Fundamentals

VectorByte Methods Training
Practical: Intro to Time Dependent Data
Author: The VectorByte Team (Leah R. Johnson, Virginia Tech)

Overview and Instructions

The goal of this practical is to practice building models for time-dependent data using simple regression-based techniques. This includes incorporating possible transformations, trying out different time-dependent predictors (including lagged variables), and assessing model fit using diagnostic plots.

Guided example: Monthly average mosquito counts in Walton County, FL

The file Culex_erraticus_walton_covariates_aggregated.csv on the course website contains data on average monthly counts of mosquitoes (sample_value) in Walton County, FL, together with monthly average maximum temperature (MaxTemp, in C) and precipitation (Precip, in inches) for each month from January 2015 through December 2017 (Month_Yr).

Exploring the Data
As always, we first want to take a look at the data, to make sure we understand it, and that we don’t have missing or weird values.
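The code that reads in the data isn't shown here; a minimal sketch, assuming the CSV has been downloaded to the working directory and read into mozData (the object name used throughout below):

mozData <- read.csv("Culex_erraticus_walton_covariates_aggregated.csv")  ## monthly counts + covariates
summary(mozData)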
   Month_Yr          sample_value        MaxTemp          Precip      
 Length:36          Min.   :0.00000   Min.   :16.02   Min.   : 0.000  
 Class :character   1st Qu.:0.04318   1st Qu.:22.99   1st Qu.: 2.162  
 Mode  :character   Median :0.73001   Median :26.69   Median : 4.606  
                    Mean   :0.80798   Mean   :26.23   Mean   : 5.595  
                    3rd Qu.:1.22443   3rd Qu.:30.70   3rd Qu.: 7.864  
                    Max.   :3.00595   Max.   :33.31   Max.   :18.307  

We can see that the minimum observed average number of mosquitoes is zero, and the max is only about 3 (there are likely many zeros averaged over many days in the month). There don’t appear to be any NAs in the data. In this case the dataset itself is small enough that we can print the whole thing to ensure it’s complete:
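For instance, a minimal way to do this:

print(mozData)  ## or just type mozData at the console to see all 36 rows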

Next we’ll examine the data graphically, including the predictors:

months <- dim(mozData)[1]
t <- 1:months ## counter for months in the data set
par(mfrow=c(3,1))
plot(t, mozData$sample_value, type="l", lwd=2,
     main="Average Monthly Abundance",
     xlab="Time (months)", ylab="Average Count")
plot(t, mozData$MaxTemp, type="l", col=2, lwd=2,
     main="Average Maximum Temp",
     xlab="Time (months)", ylab="Temperature (C)")
plot(t, mozData$Precip, type="l", col="dodgerblue", lwd=2,
     main="Average Monthly Precip",
     xlab="Time (months)", ylab="Precipitation (in)")

Visually we noticed that there may be a bit of clumping in the values for abundance (this is subtle). In particular, since we have a lot of very small/nearly zero counts, a transform such as a square root may spread things out for the abundances. It also looks like both the abundance and temperature data are more cyclical than the precipitation, and thus more likely to be related to each other. Visually there is also not much indication of a trend, but it’s usually worthwhile to consider one anyway. Replotting the abundance data with a transformation:

months <- dim(mozData)[1]
t <- 1:months ## counter for months in the data set
plot(t, sqrt(mozData$sample_value), type="l", lwd=2,
     main="Sqrt Average Monthly Abundance",
     xlab="Time (months)", ylab="Average Count")
That looks a little bit better. I suggest we go with this for our response.
Building a data frame

Before we get into model building, we always want to build a data frame containing all of the predictors that we want to consider, at the potential lags that we’re interested in. In the lecture we saw how to build the AR, sine/cosine, and trend predictors:

t <- 2:months ## to make building the AR1 predictors easier

mozTS <- data.frame(
  Y     = sqrt(mozData$sample_value[t]),   # transformed response
  Yl1   = sqrt(mozData$sample_value[t-1]), # AR1 predictor
  t     = t,                               # trend predictor
  sin12 = sin(2*pi*t/12),
  cos12 = cos(2*pi*t/12)                   # periodic predictors
)

We will also put in the temperature and precipitation predictors. But we need to think about what might be an appropriate lag. If this were daily or weekly data, we’d probably want a fairly sizable lag – mosquitoes take a while to develop, so the number we see today is not likely related to the temperature today. However, since these data are aggregated across a whole month, as are the temperature and precipitation, the current month’s values are likely to be useful. It’s also possible that last month’s values may be useful, so we’ll add those in as well:

mozTS$MaxTemp   <- mozData$MaxTemp[t]   ## current temps
mozTS$MaxTempl1 <- mozData$MaxTemp[t-1] ## previous temps
mozTS$Precip    <- mozData$Precip[t]    ## current precip
mozTS$Precipl1  <- mozData$Precip[t-1]  ## previous precip

Thus our full data frame:

summary(mozTS)

       Y               Yl1              t             sin12         
 Min.   :0.0000   Min.   :0.0000   Min.   : 2.0   Min.   :-1.00000  
 1st Qu.:0.2951   1st Qu.:0.2951   1st Qu.:10.5   1st Qu.:-0.68301  
 Median :0.8590   Median :0.8590   Median :19.0   Median : 0.00000  
 Mean   :0.7711   Mean   :0.7684   Mean   :19.0   Mean   :-0.01429  
 3rd Qu.:1.1120   3rd Qu.:1.1120   3rd Qu.:27.5   3rd Qu.: 0.68301  
 Max.   :1.7338   Max.   :1.7338   Max.   :36.0   Max.   : 1.00000  
     cos12             MaxTemp        MaxTempl1         Precip      
 Min.   :-1.00000   Min.   :16.02   Min.   :16.02   Min.   : 0.000  
 1st Qu.:-0.68301   1st Qu.:23.18   1st Qu.:23.18   1st Qu.: 1.918  
 Median : 0.00000   Median :27.23   Median :27.23   Median : 4.631  
 Mean   :-0.02474   Mean   :26.47   Mean   :26.44   Mean   : 5.660  
 3rd Qu.: 0.50000   3rd Qu.:30.79   3rd Qu.:30.79   3rd Qu.: 8.234  
 Max.   : 1.00000   Max.   :33.31   Max.   :33.31   Max.   :18.307  
    Precipl1     
 Min.   : 0.000  
 1st Qu.: 1.918  
 Median : 4.631  
 Mean   : 5.640  
 3rd Qu.: 8.234  
 Max.   :18.307  

We will first build a very simple model – just a trend – to practice building the model, checking diagnostics, and plotting predictions.
mod1 <- lm(Y ~ t, data=mozTS)
summary(mod1)

Call:
lm(formula = Y ~ t, data = mozTS)

Residuals:
     Min       1Q   Median       3Q      Max 
-0.81332 -0.47902  0.03671  0.37384  0.87119 

Coefficients:
             Estimate Std. Error t value Pr(>|t|)    
(Intercept)  0.904809   0.178421   5.071  1.5e-05 ***
t           -0.007038   0.008292  -0.849    0.402    
---
Signif. codes:  0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1

Residual standard error: 0.4954 on 33 degrees of freedom
Multiple R-squared:  0.02136,   Adjusted R-squared:  -0.008291 
F-statistic: 0.7204 on 1 and 33 DF,  p-value: 0.4021

The model output indicates that this model is not useful – the trend is not significant and it only explains about 2% of the variability. Let’s plot the predictions:
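The prediction plot itself isn’t reproduced here; a minimal sketch of one way to make it, overlaying the fitted trend from mod1 on the transformed series (the plot title is just illustrative):

plot(t, mozTS$Y, type="l", lwd=2,
     main="Trend-only model", xlab="Time (months)",
     ylab="Sqrt Average Count")        ## observed (transformed) abundances
lines(t, predict(mod1), col=2, lwd=2)  ## fitted values from the trend-only model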
Not good – we’ll definitely need to try something else! Remember that since we’re using a linear model for this, we should check our residual plots as usual, and then also plot the acf of the residuals:
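The residual diagnostic plots themselves aren’t shown here; a minimal sketch of the standard checks (residuals vs. fitted values, a Q-Q plot, and a histogram of the residuals) would be something like:

par(mfrow=c(1,3))
plot(mod1$fitted.values, mod1$residuals,
     xlab="Fitted values", ylab="Residuals")   ## look for patterns or changing spread
abline(h=0, lty=2)
qqnorm(mod1$residuals); qqline(mod1$residuals) ## check approximate normality
hist(mod1$residuals, main="", xlab="Residuals")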

This doesn’t look really bad, although the histogram might be a bit weird. Finally, the acf:

acf(mod1$residuals)

This is where we can see that we definitely aren’t able to capture the pattern: there’s substantial autocorrelation left at a 1-month lag, and again around 6 months.

Finally, moving forward, we can extract the BIC for this model so that we can compare it with the other models that you’ll build next.

n <- length(t)
extractAIC(mod1, k=log(n))[2]

[1] -44.11057

Build and compare your own models
Follow the procedure I showed for the model with a simple trend, and build at least 4 more models:
- one that contains an AR term
- one with the sine/cosine terms
- one with the environmental predictors
- one with a combination

Check diagnostics/model assumptions as you go. Then at the end compare all of your models via BIC. What is your best model by that metric? We’ll share among the group what folks found to be good models.
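As a sketch only (the particular formulas and the names mod2 through mod5 are placeholders, not the required models), the fits and the BIC comparison might look like the following; remember to also look at the residual plots and acf for each candidate, not just the BIC:

mod2 <- lm(Y ~ Yl1, data=mozTS)                                     ## AR(1) term
mod3 <- lm(Y ~ t + sin12 + cos12, data=mozTS)                       ## trend + seasonality
mod4 <- lm(Y ~ MaxTemp + MaxTempl1 + Precip + Precipl1, data=mozTS) ## environmental predictors
mod5 <- lm(Y ~ Yl1 + sin12 + cos12 + MaxTemp, data=mozTS)           ## a combination

## BIC for each model, on the same scale as the trend-only model above
n <- length(mozTS$Y)
sapply(list(mod1=mod1, mod2=mod2, mod3=mod3, mod4=mod4, mod5=mod5),
       function(m) extractAIC(m, k=log(n))[2])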
Extra Practice
Imagine that you are missing a few months at random – how would you need to modify the analysis? Try it out by removing about 5 months (not at the beginning or end of the time series).
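One way to set this up, as a sketch under the assumption that rows are dropped from mozTS after the lagged predictors have been built (so the lags still refer to the correct calendar months); the names drop, mozTS_miss, and mod1_miss are just illustrative:

set.seed(42)                                  ## so the "missing" months are reproducible
drop <- sample(5:30, 5)                       ## 5 interior months (t runs from 2 to 36)
mozTS_miss <- mozTS[!(mozTS$t %in% drop), ]   ## analysis data with those months removed

## refit and recompare; note that the effective sample size has changed
mod1_miss <- lm(Y ~ t, data=mozTS_miss)
extractAIC(mod1_miss, k=log(nrow(mozTS_miss)))[2]

If instead the raw months were removed before building the data frame, the AR1 and lagged-weather columns would no longer line up with the previous calendar month, which is exactly the complication this exercise asks you to think about.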