diff --git a/.Rproj.user/shared/notebooks/paths b/.Rproj.user/shared/notebooks/paths index ce85c5d..7c559bd 100644 --- a/.Rproj.user/shared/notebooks/paths +++ b/.Rproj.user/shared/notebooks/paths @@ -1,4 +1,5 @@ -C:/Users/David/Documents/course_pou/01-Introduction.Rmd="6061682F" -C:/Users/David/Documents/course_pou/01-Introduction2.Rmd="CAE3CA5C" -C:/Users/David/Documents/course_pou/NOTES.txt="3DE046A6" -C:/Users/David/Documents/course_pou/_bookdown.yml="C482C268" +D:/phd/course_pou/14-bootstrap.Rmd="F85B76FF" +D:/phd/course_pou/15-maximum_likelihood.Rmd="5A6AD4DF" +D:/phd/course_pou/_bookdown.yml="07C8BE57" +D:/phd/course_pou/neural_networks.R="4FB0F4BE" +D:/phd/course_pou/supervised_learning.R="45E91390" diff --git a/14-bootstrap.Rmd b/14-bootstrap.Rmd index 6fd36b4..8be3af7 100644 --- a/14-bootstrap.Rmd +++ b/14-bootstrap.Rmd @@ -379,3 +379,232 @@ bootstrap(x, T_max) # In general, bootstrap will fail when estimating the CI for the maximum. ``` + +```{exercise, name = "Practical - and fictional - coverage interval comparison"} +In this exercise, we investigate how different kinds of CI's behave as we vary the number of measurements. + +The story behind the data: it's 2025 and we've discovered that Slovenia has rich deposits of a rare mineral called Moustachium, which can be used to accelerate moustache growth. This mineral is highly sought, so the government has decided to contract two different companies to provide information on where to begin mining. Both companies investigated mining sites in each statistical region and gave their best estimate of the average Moustachium concentration in tonnes per square kilometer. The Data Science team has been called to estimate the uncertainty in these estimates and help avoid mining in the wrong region. + +Generate synthetic data with the script below: + + set.seed(0) + + library(comprehenr) + + regions <- c("pomurska", "podravska", "koroska", "savinjska", "zasavska", "posavska", "JV Slovenija", "primorsko-notranjska", "osrednjeslovenska", "gorenjska", "goriska", "obalno-kraska") + region_rates <- seq(1.3, 2.3, length.out=length(regions)) + region_rates <- region_rates[sample.int(length(regions), length(regions))] + + make_dataset <- function(n_contractors) { + measurements <- matrix(nrow=length(regions), ncol=n_contractors) + for (i in 1:length(regions)) { + measurements[i,] <- rgamma(n_contractors, 5.0, region_rates[i]) + } + + df <- data.frame(measurements) + row.names(df) <- regions + names(df) <- to_vec(for(i in 1:n_contractors) paste("Contractor", i)) + return(df) + } + + set.seed(0) + df_2025 <- make_dataset(2) + + set.seed(0) + df_2027 <- make_dataset(10) + + set.seed(0) + df_2028 <- make_dataset(100) + + set.seed(0) + df_2029 <- make_dataset(1000) + + saveRDS(df_2025, file="moustachium_2025.Rda") + saveRDS(df_2027, file="moustachium_2027.Rda") + saveRDS(df_2028, file="moustachium_2028.Rda") + saveRDS(df_2029, file="moustachium_2029.Rda") + + a. Estimate the average concentration for different regions. + + b. Estimate the average concentration uncertainty using 95% CI's (asymptotic normality with biased and unbiased standard error, standard bootstrap CI, bootstrap percentile CI). + + c. Visualize uncertainties with a histogram and discuss the best location to start mining. + + d. The year is 2027 and the government has decided to contract 10 companies. Rerun the code with new measurements and discuss how CI's change. + + e. Technological advancements in robotics have enabled site surveys on a massive scale. 
Repeat the last point for 100 surveyor robots in 2028 and 1000 surveyor robots in 2029. +``` +
+```{r, echo = togs, message = FALSE, eval = togs, warning=FALSE} +library(ggplot2) +library(dplyr) +library(data.table) + +set.seed(0) + +input_dataset_path = "moustachium_2025.Rda" # Change this for points d and e +output_plot_path = "moustachium_2025.pdf" # Change this for points d and e + +df <- readRDS(input_dataset_path) # Data comes from here +n_contractors <- ncol(df) +results_df <- data.frame(region=row.names(df)) # Store CI bounds here + +# 1. average concentration for different mining sites +results_df$average_concetration <- rowMeans(df) + +# CI for the mean based on asymptotic normality (biased SE estimate) +biased_SE <- sqrt(apply(df, 1, function(vec) {sum((vec - mean(vec))^2) / length(vec)}) / n_contractors) +results_df$ci95.an.biased_var.low <- results_df$average_concetration - 1.96 * biased_SE +results_df$ci95.an.biased_var.high <- results_df$average_concetration + 1.96 * biased_SE + +# CI for the mean based on asymptotic normality (unbiased SE estimate) +unbiased_SE <- sqrt(apply(df, 1, var) / n_contractors) +results_df$ci95.an.unbiased_var.low <- results_df$average_concetration - 1.96 * unbiased_SE +results_df$ci95.an.unbiased_var.high <- results_df$average_concetration + 1.96 * unbiased_SE + +# Standard bootstrap CI with 1000 samples +bootstrap_variance <- function(data, n_samples) { + # n_samples is m in pseudocode + output <- numeric(n_samples) + for (i in 1:n_samples) { + index <- sample(1:length(data), length(data), rep = TRUE) + resampled_data <- data[index] + output[i] <- mean(resampled_data) + } + return(var(output)) +} + +bootstrap_1000_sd <- sqrt(apply(df, 1, function(vec){bootstrap_variance(vec, 1000)})) +results_df$ci95.bootstrap.standard.1000.low <- results_df$average_concetration - 1.96 * bootstrap_1000_sd +results_df$ci95.bootstrap.standard.1000.high <- results_df$average_concetration + 1.96 * bootstrap_1000_sd + +# Bootstrap percentile CI with 1000 samples + +bootstrap_quantile <- function(data, functional, n_samples, probs) { + # n_samples is m in pseudocode + output <- numeric(n_samples) + for (i in 1:n_samples) { + index <- sample(1:length(data), length(data), rep = TRUE) + resampled_data <- data[index] + output[i] <- functional(resampled_data) + } + return(quantile(output, probs=probs)) +} + +results_df$ci95.bootstrap.percentile.1000.low <- apply(df, 1, function(vec){bootstrap_quantile(vec, mean, 1000, 0.025)}) +results_df$ci95.bootstrap.percentile.1000.high <- apply(df, 1, function(vec){bootstrap_quantile(vec, mean, 1000, 0.975)}) + +results_df + +# Visualization: we use a bar chart with uncertainty bands + +plot_moustachium_per_region <- function(region_names, average, ci_low, ci_high) { + df_visualization <- data.frame(region=region_names, average=average, low=ci_low, high=ci_high) + ggplot(df_visualization, aes(x=region, y=average)) + geom_bar(stat="identity") +} + +mask <- endsWith(colnames(results_df), "low") +mask[c(1, 2)] <- T +results_df_low <- results_df[, mask] +colnames(results_df_low) <- gsub('.low','', colnames(results_df_low)) + +mask <- endsWith(colnames(results_df), "high") +mask[c(1, 2)] <- T +results_df_high <- results_df[, mask] +colnames(results_df_high) <- gsub('.high','', colnames(results_df_high)) + +long_results_df_low <- melt(setDT(results_df_low), id.vars=c("region", "average_concetration")) +names(long_results_df_low) <- c("region", "average_concentration", "variable", "low") + +long_results_df_high <- melt(setDT(results_df_high), id.vars=c("region", "average_concetration")) +names(long_results_df_high) <- c("region", 
"average_concentration", "variable", "high") + +long_results_df <- merge(long_results_df_low, long_results_df_high, by=c("region", "variable", "average_concentration"), all=T) + +moustachium_plot <- ggplot(long_results_df, aes(x=region, y=average_concentration)) + + geom_bar(stat="identity", position="dodge", alpha=0.2) + + geom_errorbar(aes(ymin=low, ymax=high, color=variable), width=0.2, position=position_dodge(0.9)) + + scale_x_discrete(guide = guide_axis(angle = 45)) + + ylim(-1, 8) + +# ggsave(plot=moustachium_plot, width=12, height=8, dpi=300, filename=output_plot_path) +moustachium_plot + +# Visualization: we can also use a map. Circle size denotes concentration in region, low transparency denotes high uncertainty. + +library(maps) + +map_data_slo <- map_data('world')[map_data('world')$region == "Slovenia",] + +map_df <- long_results_df[long_results_df$variable == "ci95.an.biased_var", ] + +# VERY approximate longitudes and latitudes for different regions. +map_df$long <- rep(0, nrow(map_df)) +map_df$lat <- rep(0, nrow(map_df)) + +map_df[map_df$region == "gorenjska"]$long <- 14.2 +map_df[map_df$region == "gorenjska"]$lat <- 46.3 + +map_df[map_df$region == "goriska"]$long <- 13.85 +map_df[map_df$region == "goriska"]$lat <- 46.0 + +map_df[map_df$region == "obalno-kraska"]$long <- 13.9 +map_df[map_df$region == "obalno-kraska"]$lat <- 45.65 + +map_df[map_df$region == "osrednjeslovenska"]$long <- 14.5 +map_df[map_df$region == "osrednjeslovenska"]$lat <- 46. + +map_df[map_df$region == "primorsko-notranjska"]$long <- 14.3 +map_df[map_df$region == "primorsko-notranjska"]$lat <- 45.7 + +map_df[map_df$region == "zasavska"]$long <- 15 +map_df[map_df$region == "zasavska"]$lat <- 46.1 + +map_df[map_df$region == "savinjska"]$long <- 15.2 +map_df[map_df$region == "savinjska"]$lat <- 46.25 + +map_df[map_df$region == "posavska"]$long <- 15.4 +map_df[map_df$region == "posavska"]$lat <- 46 + +map_df[map_df$region == "koroska"]$long <- 15.1 +map_df[map_df$region == "koroska"]$lat <- 46.5 + +map_df[map_df$region == "podravska"]$long <- 15.7 +map_df[map_df$region == "podravska"]$lat <- 46.45 + +map_df[map_df$region == "pomurska"]$long <- 16.2 +map_df[map_df$region == "pomurska"]$lat <- 46.65 + +map_df[map_df$region == "JV Slovenija"]$long <- 15. +map_df[map_df$region == "JV Slovenija"]$lat <- 45.7 + +map_df$ci_size <- (map_df$high - map_df$low) +map_df$ci_y <- map_df$lat - 0.05 +map_df$ci_label <- sprintf("(%.2f, %.2f)", map_df$low, map_df$high) +map_df$avg_label <- sprintf("%.2f", map_df$average_concentration) + +country_plot <- ggplot() + + # First layer: worldwide map + geom_polygon(data = map_data("world"), + aes(x=long, y=lat, group = group), + color = '#9c9c9c', fill = '#f3f3f3') + + # Second layer: Country map + geom_polygon( + data = map_data_slo, + aes(x=long, y=lat, group = group), + color='darkgreen', + fill='green', + alpha=0.2 + ) + + geom_point(data=map_df, aes(x=long, y=lat, fill=region, size=average_concentration, alpha=ci_size), color="black", pch=21) + + geom_text(data=map_df, aes(x=long, y=ci_y, label=ci_label), size=3) + + geom_text(data=map_df, aes(x=long, y=lat, label=avg_label), size=3) + + scale_size_continuous(range = c(3, 12), trans = "exp") + + scale_alpha_continuous(range = c(0.15, 0.75), trans = "reverse") + + ggtitle("Estimated average Moustachium concentration with 95% CI") + + coord_cartesian(xlim=c(13.2, 16.7), ylim=c(45.4, 47.)) + +# ggsave(plot=country_plot, width=18, height=12, dpi=300, filename="country.pdf") +country_plot +``` +
diff --git a/15-maximum_likelihood.Rmd b/15-maximum_likelihood.Rmd index 22daf82..caa5797 100644 --- a/15-maximum_likelihood.Rmd +++ b/15-maximum_likelihood.Rmd @@ -351,6 +351,108 @@ my_pca$rotation ``` +```{exercise, name = "Classification"} +Let $D = \{(x_i, y_i)\}_{i=1}^n$ be a dataset of feature vectors and their corresponding integer class labels. We wish to classify feature vectors into their correct classes. + +a. Choose a suitable probability distribution $P_\theta(Y|X)$ and write its log likelihood $\ell$. +b. Choose a differentiable function $f_\phi$ that predicts parameters $\theta$ from a feature vector, i.e.\ $f_\phi(x_i) = \theta_i$. +c. Load the _iris_ dataset with `data(iris)` and split it into train and test subsets. +d. Use gradient descent to find parameters $\phi$ that minimize the negative log likelihood on the _iris_ dataset (equivalently: maximize the log likelihood). Reminder: gradient descent is the iterative optimization procedure $\phi_{t+1} = \phi_t - \eta \nabla_\phi L(\phi_t)$, where $L$ is the objective being minimized (here the negative log likelihood $-\ell$). Try $\eta = 0.01$ and run the optimization for 30 steps. Compute the gradient with `numDeriv::grad`. +e. Print the classification accuracy for the train and test subsets. +``` +
+```{solution, echo = togs} +a. We pick the categorical distribution. +b. Categorical distribution parameters are class probabilities that sum to 1. If there are $m$ classes, we can pick any differentiable function that takes as input a vector of features and predicts a vector of size $m$ whose elements are real numbers. We can then use a softmax transformation to map the predicted vector into one with non-negative entries that sum to 1. For simplicity, we can pick a linear transformation with $\phi = (W, b)$, followed by softmax: + \begin{align*} + f_\phi(x) &= \textrm{softmax}(W^T x + b), \\ + \textrm{softmax}(u)_i &= \frac{\exp(u_i)}{\sum_{j=1}^m \exp(u_j)}, + \end{align*} +where $W \in \mathbb{R}^{d\times m}, b \in \mathbb{R}^m$ and $d$ is the number of features. +``` +```{r, echo = togs, message = FALSE, eval = togs, warning=FALSE} +data(iris) +head(iris) + +# Model: +# y ~ Categorical(softmax(weights * features + bias)) +# Want to maximize the (log) likelihood of y w.r.t. weights and bias. +# Need gradient of log likelihood w.r.t. weights and bias. +# Proceed by gradient descent on negative log likelihood. + +weights <- matrix(data=rnorm(4 * 3), nrow=4, ncol=3) +bias <- matrix(data=rnorm(3), nrow=1, ncol=3) + +model <- function(features, weights, bias) { + # Linear scores: one row per observation, one column per class. + # sweep() adds the per-class bias to every row. + return(sweep(features %*% weights, 2, bias, "+")) +} + +softmax <- function(v) { + return(exp(v) / sum(exp(v))) +} + +categorical_mass <- function(targets, probs) { + # targets: matrix of size (n_data, n_classes) whose rows are one-hot vectors + # probs: matrix of size (n_data, n_classes) whose rows are class probabilities + apply(probs * targets, 1, sum) +} + +predict_probs <- function(features, model, parameters) { + # parameters is a 5 x 3 matrix: the first four rows are the weights, the last row is the bias + weights <- parameters[1:4, ] + bias <- parameters[5, ] + u <- model(features, weights, bias) + t(apply(u, 1, softmax))  # one row of class probabilities per observation +} + +accuracy <- function(features, targets, model, parameters) { + probs <- predict_probs(features, model, parameters) + argmax_mat <- t(apply(probs, 1, function(v) {v == max(v)})) + correct_predictions <- apply(argmax_mat * targets, 1, sum) + return(mean(correct_predictions)) +} + +neg_log_lik <- function(features, targets, model, parameters) { + probs <- predict_probs(features, model, parameters) + -sum(log(categorical_mass(targets, probs))) +} + +grad_neg_log_lik <- function(features, targets, model, parameters){ + numDeriv::grad(function(par){neg_log_lik(features, targets, model, par)}, parameters) +} + +gradient_descent <- function(initial_parameters, features, targets, step_size = 0.01, n_steps = 30) { + parameters <- initial_parameters + for (i in 1:n_steps) { + print(sprintf("[%d] loss: %.4f, accuracy: %.2f", i, neg_log_lik(features, targets, model, parameters), accuracy(features, targets, model, parameters))) + parameters <- parameters - step_size * grad_neg_log_lik(features, targets, model, parameters) + } + return(parameters) +} + + +x <- as.matrix(subset(iris, select=-c(Species))) +y <- matrix(nrow=nrow(iris), ncol=3) +y[, 1] <- iris$Species == "setosa" +y[, 2] <- iris$Species == "versicolor" +y[, 3] <- iris$Species == "virginica" + +# Take an equal number of representatives for every class for the training and test subsets +# Note: code is written so that shuffling does not matter during optimization +x_train <- x[c(1:35, 51:85, 101:135), ] +y_train <- y[c(1:35, 51:85, 101:135), ] + +x_test <- x[-c(1:35, 51:85, 101:135), ] +y_test <- y[-c(1:35, 51:85, 101:135), ] + +set.seed(0) +optimized_parameters <- 
gradient_descent(rbind(weights, bias), x_train, y_train) + +accuracy(x_train, y_train, model, optimized_parameters) +accuracy(x_test, y_test, model, optimized_parameters) +``` +
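+The `softmax` above divides by the sum of raw exponentials, which can overflow for large scores. A common remedy, shown here only as an optional drop-in sketch, is to subtract the maximum before exponentiating; softmax is invariant to adding a constant to its input, so the probabilities are unchanged.
+
+```{r, echo = togs, message = FALSE, eval = togs, warning=FALSE}
+# Numerically stable softmax: shift by the maximum before exponentiating.
+softmax_stable <- function(v) {
+  z <- v - max(v)
+  exp(z) / sum(exp(z))
+}
+
+# The two versions agree on moderate inputs; the stable one also handles
+# very large scores without producing NaN.
+all.equal(softmax(c(1, 2, 3)), softmax_stable(c(1, 2, 3)))
+softmax_stable(c(1000, 1001, 1002))
+```
+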
+ ## Fisher information ```{exercise} @@ -507,6 +609,84 @@ ggplot() + ``` +```{exercise} + + +Find the unit Fisher information matrix for the univariate normal distribution. +``` +
+```{solution, echo = togs} + + +The normal density is +\begin{equation*} + p(x; \mu, \sigma) = \frac{1}{\sqrt{2\pi \sigma^2}} \exp\left(-0.5 \frac{(x-\mu)^2}{\sigma^2}\right). +\end{equation*} + +Its logarithm is +\begin{equation*} + \log p(x; \mu, \sigma) = -0.5\log(2\pi) - \log \sigma - 0.5 \frac{(x-\mu)^2}{\sigma^2}. +\end{equation*} + +The second-order partial derivatives of the log density are +\begin{align*} + \frac{\partial^2}{\partial \mu^2} \log p(x; \mu, \sigma) &= -\frac{1}{\sigma^2}, \\ + \frac{\partial^2}{\partial \mu \partial \sigma} \log p(x; \mu, \sigma) &= -\frac{2(x-\mu)}{\sigma^3}, \\ + \frac{\partial^2}{\partial \sigma^2} \log p(x; \mu, \sigma) &= \frac{1}{\sigma^2} - \frac{3(x-\mu)^2}{\sigma^4}. +\end{align*} + +The unit Fisher information matrix is then +\begin{align*} +I(\mu, \sigma) = + - E\left[ + \begin{bmatrix} + -\frac{1}{\sigma^2} & -\frac{2(x-\mu)}{\sigma^3} \\ + -\frac{2(x-\mu)}{\sigma^3} & \frac{1}{\sigma^2} - \frac{3(x-\mu)^2}{\sigma^4} + \end{bmatrix} + \right] = + \begin{bmatrix} + \frac{1}{\sigma^2} & 0 \\ + 0 & \frac{2}{\sigma^2} + \end{bmatrix}, +\end{align*} +where we used the fact that $E[X - \mu] = 0$ and $E[(X - \mu)^2] = \sigma^2$. + +``` +
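+As a quick numerical sanity check, we can approximate $I(\mu, \sigma)$ by averaging the negative Hessian of the log density over a simulated sample. The chunk below is only a sketch: the sample size and the values $\mu = 0$, $\sigma = 2$ are arbitrary choices, and it assumes the `numDeriv` package (already used in the classification exercise) is available.
+
+```{r, echo = togs, message = FALSE, eval = togs, warning=FALSE}
+# Monte Carlo check of the unit Fisher information for N(mu, sigma).
+# The entries should be close to 1 / sigma^2 = 0.25 and 2 / sigma^2 = 0.5.
+set.seed(0)
+mu <- 0
+sigma <- 2
+x <- rnorm(1000, mu, sigma)
+
+log_density <- function(par, x) {
+  dnorm(x, mean = par[1], sd = par[2], log = TRUE)
+}
+
+# Average the negative Hessian of the log density over the sample.
+hessians <- sapply(x, function(xi) {
+  numDeriv::hessian(function(par) log_density(par, xi), c(mu, sigma))
+})
+-matrix(rowMeans(hessians), nrow = 2)
+```
+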
+ +```{exercise} +Find the unit Fisher information for the binomial distribution with fixed $n$. +``` +
+```{solution, echo = togs} + +The binomial mass is +\begin{equation*} + P(X = k; n, p) = \binom{n}{k}p^k(1-p)^{n-k}. +\end{equation*} + +Its logarithm is +\begin{equation*} + \log P(X = k; n, p) = \log \binom{n}{k} + k\log p + (n-k)\log(1-p). +\end{equation*} + +The first and second partial derivatives with respect to $p$ are +\begin{align*} + \frac{\partial}{\partial p} \log P(X = k; n, p) &= \frac{k}{p} - \frac{n-k}{1-p}, \\ + \frac{\partial^2}{\partial p^2} \log P(X = k; n, p) &= -\frac{k}{p^2} - \frac{n-k}{(1-p)^2}. +\end{align*} + +The unit Fisher information is +\begin{align*} +I(p) = + - E\left[ \frac{\partial^2}{\partial p^2} \log P(X = k; n, p) \right] = + \frac{E[k]}{p^2} + \frac{n - E[k]}{(1-p)^2} = + \frac{n}{p} + \frac{n}{1-p} = + \frac{n}{p(1-p)}, +\end{align*} +where we used the fact that $E[k] = np$. + +``` +
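+This result can also be checked by simulation: since the score has mean zero, the Fisher information equals the variance of the score. The sketch below uses the arbitrary values $n = 15$ and $p = 0.2$.
+
+```{r, echo = togs, message = FALSE, eval = togs, warning=FALSE}
+# Monte Carlo check of the binomial unit Fisher information.
+set.seed(0)
+n <- 15
+p <- 0.2
+k <- rbinom(100000, size = n, prob = p)
+
+# Score: d/dp log P(X = k; n, p). Its variance is the Fisher information.
+score <- k / p - (n - k) / (1 - p)
+var(score)        # simulated
+n / (p * (1 - p)) # theoretical n / (p(1 - p))
+```
+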
+ ## The German tank problem ```{exercise, name = "The German tank problem"} During WWII the allied intelligence were faced with an important problem of estimating the total production of certain German tanks, such as the Panther. What turned out to be a successful approach was to estimate the maximum from the serial numbers of the small sample of captured or destroyed tanks (describe the statistical model used). diff --git a/_bookdown.yml b/_bookdown.yml index 074641f..e7f4531 100644 --- a/_bookdown.yml +++ b/_bookdown.yml @@ -3,5 +3,5 @@ chapter_name: "Chapter " output_dir: docs rmd_files: ["index.Rmd", "01-Introduction.Rmd", "02-uncountable_probability_spaces.Rmd", "03-conditional_probability.Rmd", "04-random_variables.Rmd", "05-multiple_random_variables.Rmd", "06-integration.Rmd", "07-expected_value.Rmd", "08-multivariate_random_variables.Rmd", "09-alternative_representations.Rmd", "10-concentration_inequalities.Rmd", "11-convergence_of_random_variables.Rmd", "12-limit_theorems.Rmd", "13-estimation_basics.Rmd", "14-bootstrap.Rmd", "15-maximum_likelihood.Rmd", "16-null_hypothesis_significance_tests.Rmd", "17-Bayesian_inference.Rmd","18-distributions_intuition.Rmd", "Appendix.Rmd", "A1-R_programming_language.Rmd", "A2-probability_distributions2.Rmd", "References.Rmd"] new_session: no - +delete_merged_file: true diff --git a/docs/404.html b/docs/404.html index 908fd67..25397a0 100644 --- a/docs/404.html +++ b/docs/404.html @@ -6,7 +6,7 @@ Page not found | Principles of Uncertainty – exercises - + @@ -23,7 +23,7 @@ - + diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-13-1.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-13-1.png index 1c7dc8b..111b79e 100644 Binary files a/docs/bookdown-pou_files/figure-html/unnamed-chunk-13-1.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-13-1.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-13-2.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-13-2.png new file mode 100644 index 0000000..bb0eb40 Binary files /dev/null and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-13-2.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-14-1.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-14-1.png index 39af057..047f9da 100644 Binary files a/docs/bookdown-pou_files/figure-html/unnamed-chunk-14-1.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-14-1.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-23-1.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-23-1.png index 8d3d0b5..6e21371 100644 Binary files a/docs/bookdown-pou_files/figure-html/unnamed-chunk-23-1.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-23-1.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-24-1.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-24-1.png index 1ee82b6..6e21371 100644 Binary files a/docs/bookdown-pou_files/figure-html/unnamed-chunk-24-1.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-24-1.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-26-1.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-26-1.png index 1283656..0df7ee9 100644 Binary files a/docs/bookdown-pou_files/figure-html/unnamed-chunk-26-1.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-26-1.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-27-1.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-27-1.png index 6067ca9..0df7ee9 100644 Binary files 
a/docs/bookdown-pou_files/figure-html/unnamed-chunk-27-1.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-27-1.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-28-1.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-28-1.png index e7fa4a2..0df7ee9 100644 Binary files a/docs/bookdown-pou_files/figure-html/unnamed-chunk-28-1.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-28-1.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-30-1.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-30-1.png index dc9818e..0df7ee9 100644 Binary files a/docs/bookdown-pou_files/figure-html/unnamed-chunk-30-1.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-30-1.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-31-1.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-31-1.png index c5574a0..0df7ee9 100644 Binary files a/docs/bookdown-pou_files/figure-html/unnamed-chunk-31-1.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-31-1.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-6-1.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-6-1.png index 777ea43..b5bc9e6 100644 Binary files a/docs/bookdown-pou_files/figure-html/unnamed-chunk-6-1.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-6-1.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-9-1.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-9-1.png index ed5abff..3e02f67 100644 Binary files a/docs/bookdown-pou_files/figure-html/unnamed-chunk-9-1.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-9-1.png differ diff --git a/docs/bookdown-pou_files/figure-html/unnamed-chunk-9-2.png b/docs/bookdown-pou_files/figure-html/unnamed-chunk-9-2.png index 808921d..6ecc76d 100644 Binary files a/docs/bookdown-pou_files/figure-html/unnamed-chunk-9-2.png and b/docs/bookdown-pou_files/figure-html/unnamed-chunk-9-2.png differ diff --git a/docs/boot.html b/docs/boot.html index 0a6b41e..b0e77d4 100644 --- a/docs/boot.html +++ b/docs/boot.html @@ -6,7 +6,7 @@ Chapter 14 Bootstrap | Principles of Uncertainty – exercises - + @@ -23,7 +23,7 @@ - + @@ -327,7 +327,7 @@

Chapter 14 Bootstrap -

Exercise 14.1 Ideally, a \(1-\alpha\) CI would have \(1-\alpha\) coverage. That is, say a 95% CI should, in the long run, contain the true value of the parameter 95% of the time. In practice, it is impossible to assess the coverage of our CI method, because we rarely know the true parameter. In simulation, however, we can. Let’s assess the coverage of bootstrap percentile intervals.

+

Exercise 14.1 Ideally, a \(1-\alpha\) CI would have \(1-\alpha\) coverage. That is, say a 95% CI should, in the long run, contain the true value of the parameter 95% of the time. In practice, it is impossible to assess the coverage of our CI method, because we rarely know the true parameter. In simulation, however, we can. Let’s assess the coverage of bootstrap percentile intervals.

  1. Pick a univariate distribution with readily available mean and one that you can easily sample from.

  2. Draw \(n = 30\) random samples from the chosen distribution and use the bootstrap (with large enough m) and percentile CI method to construct 95% CI. Repeat the process many times and count how many times the CI contains the true mean. That is, compute the actual coverage probability (don’t forget to include the standard error of the coverage probability!). What can you observe?

  3. @@ -338,91 +338,91 @@

    Chapter 14 Bootstrap -
    library(boot)
    -set.seed(0)
    -nit   <- 1000  # Repeat the process "many times"
    -alpha <- 0.05  # CI parameter
    -nboot <- 100   # m parameter for bootstrap ("large enough m")
    -# f: change this to 200 or 5.
    -nsample <- 30  # n = 30 random samples from the chosen distribution. Comment out BCa code if it breaks.
    -covers     <- matrix(nrow = nit, ncol = 3)
    -covers_BCa <- matrix(nrow = nit, ncol = 3)
    -covers_asymp_norm <- matrix(nrow = nit, ncol = 3)
    -
    -isin <- function (x, lower, upper) {
    -  (x > lower) & (x < upper)
    -}
    -
    -for (j in 1:nit) {  # Repeating many times
    -  # a: pick a univariate distribution - standard normal
    -  x1 <- rnorm(nsample)
    -  
    -  # c: one or two different distributions - beta and poisson
    -  x2 <- rbeta(nsample, 1, 2)
    -  x3 <- rpois(nsample, 5)
    -  
    -  X1 <- matrix(data = NA, nrow = nsample, ncol = nboot)
    -  X2 <- matrix(data = NA, nrow = nsample, ncol = nboot)
    -  X3 <- matrix(data = NA, nrow = nsample, ncol = nboot)
    -  for (i in 1:nboot) {
    -    X1[ ,i] <- sample(x1, nsample, replace = T)
    -    X2[ ,i] <- sample(x2, nsample, T)
    -    X3[ ,i] <- sample(x3, nsample, T)
    -  }
    -  X1_func <- apply(X1, 2, mean)
    -  X2_func <- apply(X2, 2, mean)
    -  X3_func <- apply(X3, 2, mean)
    -  X1_quant <- quantile(X1_func, probs = c(alpha / 2, 1 - alpha / 2))
    -  X2_quant <- quantile(X2_func, probs = c(alpha / 2, 1 - alpha / 2))
    -  X3_quant <- quantile(X3_func, probs = c(alpha / 2, 1 - alpha / 2))
    -  covers[j,1] <- (0 > X1_quant[1]) & (0 < X1_quant[2])
    -  covers[j,2] <- ((1 / 3) > X2_quant[1]) & ((1 / 3) < X2_quant[2])
    -  covers[j,3] <- (5 > X3_quant[1]) & (5 < X3_quant[2])
    -
    -  mf     <- function (x, i) return(mean(x[i]))
    -  bootX1 <- boot(x1, statistic = mf, R = nboot)
    -  bootX2 <- boot(x2, statistic = mf, R = nboot)
    -  bootX3 <- boot(x3, statistic = mf, R = nboot)
    -
    -  X1_quant_BCa <- boot.ci(bootX1, type = "bca")$bca
    -  X2_quant_BCa <- boot.ci(bootX2, type = "bca")$bca
    -  X3_quant_BCa <- boot.ci(bootX3, type = "bca")$bca
    -  
    -  covers_BCa[j,1] <- (0 > X1_quant_BCa[4]) & (0 < X1_quant_BCa[5])
    -  covers_BCa[j,2] <- ((1 / 3) > X2_quant_BCa[4]) & ((1 / 3) < X2_quant_BCa[5])
    -  covers_BCa[j,3] <- (5 > X3_quant_BCa[4]) & (5 < X3_quant_BCa[5])
    -  
    -  # e: estimate mean and standard error
    -  # sample mean:
    -  x1_bar <- mean(x1)
    -  x2_bar <- mean(x2)
    -  x3_bar <- mean(x3)
    -  
    -  # standard error (of the sample mean) estimate: sample standard deviation / sqrt(n)
    -  x1_bar_SE <- sd(x1) / sqrt(nsample)
    -  x2_bar_SE <- sd(x2) / sqrt(nsample)
    -  x3_bar_SE <- sd(x3) / sqrt(nsample)
    -  
    -  covers_asymp_norm[j,1] <- isin(0, x1_bar - 1.96 * x1_bar_SE, x1_bar + 1.96 * x1_bar_SE)
    -  covers_asymp_norm[j,2] <- isin(1/3, x2_bar - 1.96 * x2_bar_SE, x2_bar + 1.96 * x2_bar_SE)
    -  covers_asymp_norm[j,3] <- isin(5, x3_bar - 1.96 * x3_bar_SE, x3_bar + 1.96 * x3_bar_SE)
    -
    -}
    -apply(covers, 2, mean)
    +
    library(boot)
    +set.seed(0)
    +nit   <- 1000  # Repeat the process "many times"
    +alpha <- 0.05  # CI parameter
    +nboot <- 100   # m parameter for bootstrap ("large enough m")
    +# f: change this to 200 or 5.
    +nsample <- 30  # n = 30 random samples from the chosen distribution. Comment out BCa code if it breaks.
    +covers     <- matrix(nrow = nit, ncol = 3)
    +covers_BCa <- matrix(nrow = nit, ncol = 3)
    +covers_asymp_norm <- matrix(nrow = nit, ncol = 3)
    +
    +isin <- function (x, lower, upper) {
    +  (x > lower) & (x < upper)
    +}
    +
    +for (j in 1:nit) {  # Repeating many times
    +  # a: pick a univariate distribution - standard normal
    +  x1 <- rnorm(nsample)
    +  
    +  # c: one or two different distributions - beta and poisson
    +  x2 <- rbeta(nsample, 1, 2)
    +  x3 <- rpois(nsample, 5)
    +  
    +  X1 <- matrix(data = NA, nrow = nsample, ncol = nboot)
    +  X2 <- matrix(data = NA, nrow = nsample, ncol = nboot)
    +  X3 <- matrix(data = NA, nrow = nsample, ncol = nboot)
    +  for (i in 1:nboot) {
    +    X1[ ,i] <- sample(x1, nsample, replace = T)
    +    X2[ ,i] <- sample(x2, nsample, T)
    +    X3[ ,i] <- sample(x3, nsample, T)
    +  }
    +  X1_func <- apply(X1, 2, mean)
    +  X2_func <- apply(X2, 2, mean)
    +  X3_func <- apply(X3, 2, mean)
    +  X1_quant <- quantile(X1_func, probs = c(alpha / 2, 1 - alpha / 2))
    +  X2_quant <- quantile(X2_func, probs = c(alpha / 2, 1 - alpha / 2))
    +  X3_quant <- quantile(X3_func, probs = c(alpha / 2, 1 - alpha / 2))
    +  covers[j,1] <- (0 > X1_quant[1]) & (0 < X1_quant[2])
    +  covers[j,2] <- ((1 / 3) > X2_quant[1]) & ((1 / 3) < X2_quant[2])
    +  covers[j,3] <- (5 > X3_quant[1]) & (5 < X3_quant[2])
    +
    +  mf     <- function (x, i) return(mean(x[i]))
    +  bootX1 <- boot(x1, statistic = mf, R = nboot)
    +  bootX2 <- boot(x2, statistic = mf, R = nboot)
    +  bootX3 <- boot(x3, statistic = mf, R = nboot)
    +
    +  X1_quant_BCa <- boot.ci(bootX1, type = "bca")$bca
    +  X2_quant_BCa <- boot.ci(bootX2, type = "bca")$bca
    +  X3_quant_BCa <- boot.ci(bootX3, type = "bca")$bca
    +  
    +  covers_BCa[j,1] <- (0 > X1_quant_BCa[4]) & (0 < X1_quant_BCa[5])
    +  covers_BCa[j,2] <- ((1 / 3) > X2_quant_BCa[4]) & ((1 / 3) < X2_quant_BCa[5])
    +  covers_BCa[j,3] <- (5 > X3_quant_BCa[4]) & (5 < X3_quant_BCa[5])
    +  
    +  # e: estimate mean and standard error
    +  # sample mean:
    +  x1_bar <- mean(x1)
    +  x2_bar <- mean(x2)
    +  x3_bar <- mean(x3)
    +  
    +  # standard error (of the sample mean) estimate: sample standard deviation / sqrt(n)
    +  x1_bar_SE <- sd(x1) / sqrt(nsample)
    +  x2_bar_SE <- sd(x2) / sqrt(nsample)
    +  x3_bar_SE <- sd(x3) / sqrt(nsample)
    +  
    +  covers_asymp_norm[j,1] <- isin(0, x1_bar - 1.96 * x1_bar_SE, x1_bar + 1.96 * x1_bar_SE)
    +  covers_asymp_norm[j,2] <- isin(1/3, x2_bar - 1.96 * x2_bar_SE, x2_bar + 1.96 * x2_bar_SE)
    +  covers_asymp_norm[j,3] <- isin(5, x3_bar - 1.96 * x3_bar_SE, x3_bar + 1.96 * x3_bar_SE)
    +
    +}
    +apply(covers, 2, mean)
    ## [1] 0.918 0.925 0.905
    -
    apply(covers, 2, sd) / sqrt(nit)
    +
    apply(covers, 2, sd) / sqrt(nit)
    ## [1] 0.008680516 0.008333333 0.009276910
    -
    apply(covers_BCa, 2, mean)
    +
    apply(covers_BCa, 2, mean)
    ## [1] 0.927 0.944 0.927
    -
    apply(covers_BCa, 2, sd) / sqrt(nit)
    +
    apply(covers_BCa, 2, sd) / sqrt(nit)
    ## [1] 0.008230355 0.007274401 0.008230355
    -
    apply(covers_asymp_norm, 2, mean)
    +
    apply(covers_asymp_norm, 2, mean)
    ## [1] 0.939 0.937 0.930
    -
    apply(covers_asymp_norm, 2, sd) / sqrt(nit)
    +
    apply(covers_asymp_norm, 2, sd) / sqrt(nit)
    ## [1] 0.007572076 0.007687008 0.008072494
    -

    Exercise 14.2 +

    Exercise 14.2 You are given a sample of independent observations from a process of interest:

    @@ -460,41 +460,41 @@

    Chapter 14 Bootstrap -
    # a
    -x <- c(7, 2, 4, 6, 4, 5, 9, 10)
    -n <- length(x)
    -mu <- mean(x)
    -
    -SE <- sqrt(mean((x - mu)^2)) / sqrt(n)
    -SE
    +
    # a
    +x <- c(7, 2, 4, 6, 4, 5, 9, 10)
    +n <- length(x)
    +mu <- mean(x)
    +
    +SE <- sqrt(mean((x - mu)^2)) / sqrt(n)
    +SE
    ## [1] 0.8915839
    -
    z <- qnorm(1 - 0.05 / 2)
    -c(mu - z * SE, mu + z * SE)
    +
    z <- qnorm(1 - 0.05 / 2)
    +c(mu - z * SE, mu + z * SE)
    ## [1] 4.127528 7.622472
    -
    # b
    -SE <- sd(x) / sqrt(n)
    -SE
    +
    # b
    +SE <- sd(x) / sqrt(n)
    +SE
    ## [1] 0.9531433
    -
    c(mu - z * SE, mu + z * SE)
    +
    c(mu - z * SE, mu + z * SE)
    ## [1] 4.006873 7.743127
    -
    # c
    -set.seed(0)
    -
    -m  <- 1000
    -T_mean <- function(x) {mean(x)}
    -
    -est_boot <- array(NA, m)
    -for (i in 1:m) {
    -  x_boot <- x[sample(1:n, n, rep = T)]
    -  est_boot[i] <- T_mean(x_boot)
    -}
    -
    -quantile(est_boot, p = c(0.025, 0.975))
    +
    # c
    +set.seed(0)
    +
    +m  <- 1000
    +T_mean <- function(x) {mean(x)}
    +
    +est_boot <- array(NA, m)
    +for (i in 1:m) {
    +  x_boot <- x[sample(1:n, n, rep = T)]
    +  est_boot[i] <- T_mean(x_boot)
    +}
    +
    +quantile(est_boot, p = c(0.025, 0.975))
    ##  2.5% 97.5% 
     ## 4.250 7.625
    -

    Exercise 14.3 +

    Exercise 14.3 We are given a sample of 10 independent paired (bivariate) observations:

    @@ -564,59 +564,59 @@

    Chapter 14 Bootstrap -
    x <- c(1.26, -0.33,  1.33,  1.27,  0.41, -1.54, -0.93, -0.29, -0.01,  2.40)
    -y <- c(2.64,  0.33,  0.48,  0.06, -0.88, -2.14, -2.21,  0.95,  0.83,  1.45)
    -
    -# a
    -cor(x, y)
    +
    x <- c(1.26, -0.33,  1.33,  1.27,  0.41, -1.54, -0.93, -0.29, -0.01,  2.40)
    +y <- c(2.64,  0.33,  0.48,  0.06, -0.88, -2.14, -2.21,  0.95,  0.83,  1.45)
    +
    +# a
    +cor(x, y)
    ## [1] 0.6991247
    -
    # b
    -res <- cor.test(x, y)
    -res$conf.int[1:2]
    +
    # b
    +res <- cor.test(x, y)
    +res$conf.int[1:2]
    ## [1] 0.1241458 0.9226238
    -
    # c
    -set.seed(0)
    -m  <- 1000
    -n  <- length(x) 
    -T_cor <- function(x, y) {cor(x, y)}
    -
    -est_boot <- array(NA, m)
    -for (i in 1:m) {
    -  idx <- sample(1:n, n, rep = T) # !!! important to use same indices to keep dependency between x and y
    -  est_boot[i] <- T_cor(x[idx], y[idx])
    -}
    -
    -quantile(est_boot, p = c(0.025, 0.975))
    +
    # c
    +set.seed(0)
    +m  <- 1000
    +n  <- length(x) 
    +T_cor <- function(x, y) {cor(x, y)}
    +
    +est_boot <- array(NA, m)
    +for (i in 1:m) {
    +  idx <- sample(1:n, n, rep = T) # !!! important to use same indices to keep dependency between x and y
    +  est_boot[i] <- T_cor(x[idx], y[idx])
    +}
    +
    +quantile(est_boot, p = c(0.025, 0.975))
    ##      2.5%     97.5% 
     ## 0.2565537 0.9057664
    -
    # d
    -# Yes, but the bootstrap CI is more narrow.
    -
    -# e
    -# We just use the functions for Kendall/Spearman coefficients instead:
    -T_kendall <- function(x, y) {cor(x, y, method = "kendall")}
    -T_spearman <- function(x, y) {cor(x, y, method = "spearman")}
    -
    -# Put this in a function that returns the CI
    -bootstrap_95_ci <- function(x, y, t, m = 1000) {
    -  n <- length(x)
    -  est_boot <- array(NA, m)
    -  for (i in 1:m) {
    -    idx <- sample(1:n, n, rep = T) # !!! important to use same indices to keep dependency between x and y
    -    est_boot[i] <- t(x[idx], y[idx])
    -  }
    -  quantile(est_boot, p = c(0.025, 0.975))
    -}
    -
    -bootstrap_95_ci(x, y, T_kendall)
    +
    # d
    +# Yes, but the bootstrap CI is more narrow.
    +
    +# e
    +# We just use the functions for Kendall/Spearman coefficients instead:
    +T_kendall <- function(x, y) {cor(x, y, method = "kendall")}
    +T_spearman <- function(x, y) {cor(x, y, method = "spearman")}
    +
    +# Put this in a function that returns the CI
    +bootstrap_95_ci <- function(x, y, t, m = 1000) {
    +  n <- length(x)
    +  est_boot <- array(NA, m)
    +  for (i in 1:m) {
    +    idx <- sample(1:n, n, rep = T) # !!! important to use same indices to keep dependency between x and y
    +    est_boot[i] <- t(x[idx], y[idx])
    +  }
    +  quantile(est_boot, p = c(0.025, 0.975))
    +}
    +
    +bootstrap_95_ci(x, y, T_kendall)
    ##        2.5%       97.5% 
     ## -0.08108108  0.78378378
    -
    bootstrap_95_ci(x, y, T_spearman)
    +
    bootstrap_95_ci(x, y, T_spearman)
    ##       2.5%      97.5% 
     ## -0.1701115  0.8867925
    -

    Exercise 14.4 +

    Exercise 14.4 In this problem we will illustrate the use of the nonparametric bootstrap for estimating CIs of regression model coefficients.

      @@ -626,15 +626,15 @@

      Chapter 14 Bootstrap -
      # a
      -data(longley)
      -
      -# b
      -res <- lm(Employed ~ . , longley)
      -tmp <- data.frame(summary(res)$coefficients[,1:2])
      -tmp$LB <- tmp[,1] - 1.96 * tmp[,2]
      -tmp$UB <- tmp[,1] + 1.96 * tmp[,2]
      -tmp
      +
      # a
      +data(longley)
      +
      +# b
      +res <- lm(Employed ~ . , longley)
      +tmp <- data.frame(summary(res)$coefficients[,1:2])
      +tmp$LB <- tmp[,1] - 1.96 * tmp[,2]
      +tmp$UB <- tmp[,1] + 1.96 * tmp[,2]
      +tmp
      ##                   Estimate   Std..Error            LB            UB
       ## (Intercept)  -3.482259e+03 8.904204e+02 -5.227483e+03 -1.737035e+03
       ## GNP.deflator  1.506187e-02 8.491493e-02 -1.513714e-01  1.814951e-01
      @@ -643,37 +643,37 @@ 

      Chapter 14 Bootstrap
      # c
      -set.seed(0)
      -m <- 100
      -n <- nrow(longley)
      -T_coef <- function(x) {
      -  lm(Employed ~ . , x)$coefficients
      -}
      -
      -est_boot <- array(NA, c(m, ncol(longley)))
      -for (i in 1:m) {
      -  idx <- sample(1:n, n, rep = T)
      -  est_boot[i,] <- T_coef(longley[idx,])
      -}
      -
      -SE <- apply(est_boot, 2, sd)
      -SE

    +
    # c
    +set.seed(0)
    +m <- 100
    +n <- nrow(longley)
    +T_coef <- function(x) {
    +  lm(Employed ~ . , x)$coefficients
    +}
    +
    +est_boot <- array(NA, c(m, ncol(longley)))
    +for (i in 1:m) {
    +  idx <- sample(1:n, n, rep = T)
    +  est_boot[i,] <- T_coef(longley[idx,])
    +}
    +
    +SE <- apply(est_boot, 2, sd)
    +SE
    ## [1] 1.826011e+03 1.605981e-01 5.693746e-02 8.204892e-03 3.802225e-03
     ## [6] 3.907527e-01 9.414436e-01
    -
    # Show the standard errors around coefficients
    -library(ggplot2)
    -library(reshape2)
    -df <- data.frame(index = 1:7, bootstrap_SE = SE, lm_SE = tmp$Std..Error)
    -melted_df <- melt(df[2:nrow(df), ], id.vars = "index")  # Ignore bias which has a really large magnitude
    -ggplot(melted_df, aes(x = index, y = value, fill = variable)) +
    -  geom_bar(stat="identity", position="dodge") +
    -  xlab("Coefficient") +
    -  ylab("Standard error") # + scale_y_continuous(trans = "log") # If you want to also plot bias
    -

    +
    # Show the standard errors around coefficients
    +library(ggplot2)
    +library(reshape2)
    +df <- data.frame(index = 1:7, bootstrap_SE = SE, lm_SE = tmp$Std..Error)
    +melted_df <- melt(df[2:nrow(df), ], id.vars = "index")  # Ignore bias which has a really large magnitude
    +ggplot(melted_df, aes(x = index, y = value, fill = variable)) +
    +  geom_bar(stat="identity", position="dodge") +
    +  xlab("Coefficient") +
    +  ylab("Standard error") # + scale_y_continuous(trans = "log") # If you want to also plot bias
    +

    -

    Exercise 14.5 +

    Exercise 14.5 This exercise shows a shortcoming of the bootstrap method when using the plug in estimator for the maximum.

      @@ -683,38 +683,310 @@

      Chapter 14 Bootstrap -
      # bootstrap CI for maximum
      -
      -alpha <- 0.05
      -T_max <- function(x) {max(x)}  # Equal to T_max = max
      -bootstrap <- function(x, t, m = 1000) {
      -  n <- length(x)
      -  values <- rep(0, m)
      -  for (i in 1:m) {
      -    values[i] <- t(sample(x, n, replace = T))
      -  }
      -  quantile(values, probs = c(alpha / 2, 1 - alpha / 2))
      -}
      -
      -# a
      -# Meaningless, as the normal distribution can yield arbitrarily large values.
      -x <- rnorm(100)
      -bootstrap(x, T_max)
      +
      # bootstrap CI for maximum
      +
      +alpha <- 0.05
      +T_max <- function(x) {max(x)}  # Equal to T_max = max
      +bootstrap <- function(x, t, m = 1000) {
      +  n <- length(x)
      +  values <- rep(0, m)
      +  for (i in 1:m) {
      +    values[i] <- t(sample(x, n, replace = T))
      +  }
      +  quantile(values, probs = c(alpha / 2, 1 - alpha / 2))
      +}
      +
      +# a
      +# Meaningless, as the normal distribution can yield arbitrarily large values.
      +x <- rnorm(100)
      +bootstrap(x, T_max)
      ##     2.5%    97.5% 
       ## 1.819425 2.961743
      -
      # b
      -x <- rbinom(100, size = 15, prob = 0.2) # min = 0, max = 15
      -bootstrap(x, T_max)
      +
      # b
      +x <- rbinom(100, size = 15, prob = 0.2) # min = 0, max = 15
      +bootstrap(x, T_max)
      ##  2.5% 97.5% 
       ##     6     7
      -
      # c
      -x <- rbinom(100, size = 15, prob = 0.9) # min = 0, max = 15
      -bootstrap(x, T_max)
      +
      # c
      +x <- rbinom(100, size = 15, prob = 0.9) # min = 0, max = 15
      +bootstrap(x, T_max)
      ##  2.5% 97.5% 
       ##    15    15
      -
      # Observation: to estimate the maximum, we need sufficient probability mass near the maximum value the distribution can yield.
      -# Using bootstrap is pointless when there is too little mass near the true maximum.
      -# In general, bootstrap will fail when estimating the CI for the maximum.
      +
      # Observation: to estimate the maximum, we need sufficient probability mass near the maximum value the distribution can yield.
      +# Using bootstrap is pointless when there is too little mass near the true maximum.
      +# In general, bootstrap will fail when estimating the CI for the maximum.
      +

    +
    +

    Exercise 14.6 (Practical - and fictional - coverage interval comparison) In this exercise, we investigate how different kinds of CI’s behave as we vary the number of measurements.

    +

    The story behind the data: it’s 2025 and we’ve discovered that Slovenia has rich deposits of a rare mineral called Moustachium, which can be used to accelerate moustache growth. This mineral is highly sought, so the government has decided to contract two different companies to provide information on where to begin mining. Both companies investigated mining sites in each statistical region and gave their best estimate of the average Moustachium concentration in tonnes per square kilometer. The Data Science team has been called to estimate the uncertainty in these estimates and help avoid mining in the wrong region.

    +

    Generate synthetic data with the script below:

    +
    set.seed(0)
    +
    +library(comprehenr)
    +
    +regions <- c("pomurska", "podravska", "koroska", "savinjska", "zasavska", "posavska", "JV Slovenija", "primorsko-notranjska", "osrednjeslovenska", "gorenjska", "goriska", "obalno-kraska")
    +region_rates <- seq(1.3, 2.3, length.out=length(regions))
    +region_rates <- region_rates[sample.int(length(regions), length(regions))]
    +
    +make_dataset <- function(n_contractors) {
    +    measurements <- matrix(nrow=length(regions), ncol=n_contractors)
    +    for (i in 1:length(regions)) {
    +        measurements[i,] <- rgamma(n_contractors, 5.0, region_rates[i])
    +    }
    +
    +    df <- data.frame(measurements)
    +    row.names(df) <- regions
    +    names(df) <- to_vec(for(i in 1:n_contractors) paste("Contractor", i))
    +    return(df)
    +}
    +
    +set.seed(0)
    +df_2025 <- make_dataset(2)
    +
    +set.seed(0)
    +df_2027 <- make_dataset(10)
    +
    +set.seed(0)
    +df_2028 <- make_dataset(100)
    +
    +set.seed(0)
    +df_2029 <- make_dataset(1000)
    +
    +saveRDS(df_2025, file="moustachium_2025.Rda")
    +saveRDS(df_2027, file="moustachium_2027.Rda")
    +saveRDS(df_2028, file="moustachium_2028.Rda")
    +saveRDS(df_2029, file="moustachium_2029.Rda")
    +
      +
    1. Estimate the average concentration for different regions.

    2. +
    3. Estimate the average concentration uncertainty using 95% CI’s (asymptotic normality with biased and unbiased standard error, standard bootstrap CI, bootstrap percentile CI).

    4. +
    5. Visualize uncertainties with a histogram and discuss the best location to start mining.

    6. +
    7. The year is 2027 and the government has decided to contract 10 companies. Rerun the code with new measurements and discuss how CI’s change.

    8. +
    9. Technological advancements in robotics have enabled site surveys on a massive scale. Repeat the last point for 100 surveyor robots in 2028 and 1000 surveyor robots in 2029.

    10. +
    +
    +
    +
    library(ggplot2)
    +library(dplyr)
    +library(data.table)
    +
    +set.seed(0)
    +
    +input_dataset_path = "moustachium_2025.Rda"  # Change this for points d and e
    +output_plot_path = "moustachium_2025.pdf"  # Change this for points d and e
    +
    +df <- readRDS(input_dataset_path)  # Data comes from here
    +n_contractors <- ncol(df)
    +results_df <- data.frame(region=row.names(df))  # Store CI bounds here
    +
    +# 1. average concentration for different mining sites
    +results_df$average_concetration <- rowMeans(df)
    +
    +# CI for the mean based on asymptotic normality (biased SE estimate)
    +biased_SE <- sqrt(apply(df, 1, function(vec) {sum((vec - mean(vec))^2) / length(vec)}) / n_contractors)
    +results_df$ci95.an.biased_var.low <- results_df$average_concetration - 1.96 * biased_SE
    +results_df$ci95.an.biased_var.high <- results_df$average_concetration + 1.96 * biased_SE
    +
    +# CI for the mean based on asymptotic normality (unbiased SE estimate)
    +unbiased_SE <- sqrt(apply(df, 1, var) / n_contractors)
    +results_df$ci95.an.unbiased_var.low <- results_df$average_concetration - 1.96 * unbiased_SE
    +results_df$ci95.an.unbiased_var.high <- results_df$average_concetration + 1.96 * unbiased_SE
    +
    +# Standard bootstrap CI with 1000 samples
    +bootstrap_variance <- function(data, n_samples) {
    +  # n_samples is m in pseudocode
    +  output <- numeric(n_samples)
    +  for (i in 1:n_samples) {
    +    index <- sample(1:length(data), length(data), rep = TRUE)
    +    resampled_data <- data[index]
    +    output[i] <- mean(resampled_data)
    +  }
    +  return(var(output))
    +}
    +
    +bootstrap_1000_sd <- sqrt(apply(df, 1, function(vec){bootstrap_variance(vec, 1000)}))
    +results_df$ci95.bootstrap.standard.1000.low <- results_df$average_concetration - 1.96 * bootstrap_1000_sd
    +results_df$ci95.bootstrap.standard.1000.high <- results_df$average_concetration + 1.96 * bootstrap_1000_sd
    +
    +# Bootstrap percentile CI with 1000 samples
    +
    +bootstrap_quantile <- function(data, functional, n_samples, probs) {
    +    # n_samples is m in pseudocode
    +    output <- numeric(n_samples)
    +    for (i in 1:n_samples) {
    +        index <- sample(1:length(data), length(data), rep = TRUE)
    +        resampled_data <- data[index]
    +        output[i] <- functional(resampled_data)
    +    }
    +    return(quantile(output, probs=probs))
    +}
    +
    +results_df$ci95.bootstrap.percentile.1000.low <- apply(df, 1, function(vec){bootstrap_quantile(vec, mean, 1000, 0.025)})
    +results_df$ci95.bootstrap.percentile.1000.high <- apply(df, 1, function(vec){bootstrap_quantile(vec, mean, 1000, 0.975)})
    +
    +results_df
    +
    ##                  region average_concetration ci95.an.biased_var.low
    +## 1              pomurska             2.814731              1.5351811
    +## 2             podravska             2.646518              1.5358919
    +## 3               koroska             2.010216              0.5956186
    +## 4             savinjska             4.618001              4.4057369
    +## 5              zasavska             2.458873              2.0050840
    +## 6              posavska             2.153802              1.9001244
    +## 7          JV Slovenija             2.433503              1.6860397
    +## 8  primorsko-notranjska             3.165394              2.9640430
    +## 9     osrednjeslovenska             3.696875              3.5592419
    +## 10            gorenjska             1.341931              0.2784547
    +## 11              goriska             2.767328              2.3255569
    +## 12        obalno-kraska             1.580711              1.4533751
    +##    ci95.an.biased_var.high ci95.an.unbiased_var.low ci95.an.unbiased_var.high
    +## 1                 4.094281              1.005174095                  4.624288
    +## 2                 3.757144              1.075855548                  4.217180
    +## 3                 3.424813              0.009673183                  4.010759
    +## 4                 4.830264              4.317814385                  4.918187
    +## 5                 2.912662              1.817118318                  3.100628
    +## 6                 2.407479              1.795047746                  2.512556
    +## 7                 3.180965              1.376430415                  3.490575
    +## 8                 3.366746              2.880640556                  3.450148
    +## 9                 3.834508              3.502232367                  3.891518
    +## 10                2.405407             -0.162051549                  2.845913
    +## 11                3.209099              2.142569481                  3.392086
    +## 12                1.708047              1.400630772                  1.760792
    +##    ci95.bootstrap.standard.1000.low ci95.bootstrap.standard.1000.high
    +## 1                         1.5397542                          4.089708
    +## 2                         1.5388631                          3.754173
    +## 3                         0.5492603                          3.471171
    +## 4                         4.4062860                          4.829715
    +## 5                         1.9938049                          2.923942
    +## 6                         1.9010514                          2.406552
    +## 7                         1.6932573                          3.173748
    +## 8                         2.9670216                          3.363767
    +## 9                         3.5602064                          3.833544
    +## 10                        0.2845999                          2.399262
    +## 11                        2.3293359                          3.205320
    +## 12                        1.4543352                          1.707087
    +##    ci95.bootstrap.percentile.1000.low ci95.bootstrap.percentile.1000.high
    +## 1                           1.8914878                            3.737975
    +## 2                           1.8451596                            3.447876
    +## 3                           0.9895308                            3.030901
    +## 4                           4.4648444                            4.771157
    +## 5                           2.1314473                            2.786299
    +## 6                           1.9707640                            2.336840
    +## 7                           1.8941800                            2.972825
    +## 8                           3.0201118                            3.310677
    +## 9                           3.5975676                            3.796183
    +## 10                          0.5745928                            2.109269
    +## 11                          2.4485735                            3.086082
    +## 12                          1.4888334                            1.672589
    +
    # Visualization: we use a bar chart with uncertainty bands
    +
    +plot_moustachium_per_region <- function(region_names, average, ci_low, ci_high) {
    +    df_visualization <- data.frame(region=region_names, average=average, low=ci_low, high=ci_high)
    +    ggplot(df_visualization, aes(x=region, y=average)) + geom_bar(stat="identity")
    +}
    +
    +mask <- endsWith(colnames(results_df), "low")
    +mask[c(1, 2)] <- T
    +results_df_low <- results_df[, mask]
    +colnames(results_df_low) <- gsub('.low','', colnames(results_df_low))
    +
    +mask <- endsWith(colnames(results_df), "high")
    +mask[c(1, 2)] <- T
    +results_df_high <- results_df[, mask]
    +colnames(results_df_high) <- gsub('.high','', colnames(results_df_high))
    +
    +long_results_df_low <- melt(setDT(results_df_low), id.vars=c("region", "average_concetration"))
    +names(long_results_df_low) <- c("region", "average_concentration", "variable", "low")
    +
    +long_results_df_high <- melt(setDT(results_df_high), id.vars=c("region", "average_concetration"))
    +names(long_results_df_high) <- c("region", "average_concentration", "variable", "high")
    +
    +long_results_df <- merge(long_results_df_low, long_results_df_high, by=c("region", "variable", "average_concentration"), all=T)
    +
    +moustachium_plot <- ggplot(long_results_df, aes(x=region, y=average_concentration)) +
    +    geom_bar(stat="identity", position="dodge", alpha=0.2) +
    +    geom_errorbar(aes(ymin=low, ymax=high, color=variable), width=0.2, position=position_dodge(0.9)) +
    +    scale_x_discrete(guide = guide_axis(angle = 45)) +
    +    ylim(-1, 8)
    +
    +# ggsave(plot=moustachium_plot, width=12, height=8, dpi=300, filename=output_plot_path)
    +moustachium_plot
    +

    +
    # Visualization: we can also use a map. Circle size denotes concentration in region, low transparency denotes high uncertainty.
    +
    +library(maps)
    +
    +map_data_slo <- map_data('world')[map_data('world')$region == "Slovenia",]
    +
    +map_df <- long_results_df[long_results_df$variable == "ci95.an.biased_var", ]
    +
    +# VERY approximate longitudes and latitudes for different regions.
    +map_df$long <- rep(0, nrow(map_df))
    +map_df$lat <- rep(0, nrow(map_df))
    +
    +map_df[map_df$region == "gorenjska"]$long <- 14.2
    +map_df[map_df$region == "gorenjska"]$lat <- 46.3
    +
    +map_df[map_df$region == "goriska"]$long <- 13.85
    +map_df[map_df$region == "goriska"]$lat <- 46.0
    +
    +map_df[map_df$region == "obalno-kraska"]$long <- 13.9
    +map_df[map_df$region == "obalno-kraska"]$lat <- 45.65
    +
    +map_df[map_df$region == "osrednjeslovenska"]$long <- 14.5
    +map_df[map_df$region == "osrednjeslovenska"]$lat <- 46.
    +
    +map_df[map_df$region == "primorsko-notranjska"]$long <- 14.3
    +map_df[map_df$region == "primorsko-notranjska"]$lat <- 45.7
    +
    +map_df[map_df$region == "zasavska"]$long <- 15
    +map_df[map_df$region == "zasavska"]$lat <- 46.1
    +
    +map_df[map_df$region == "savinjska"]$long <- 15.2
    +map_df[map_df$region == "savinjska"]$lat <- 46.25
    +
    +map_df[map_df$region == "posavska"]$long <- 15.4
    +map_df[map_df$region == "posavska"]$lat <- 46
    +
    +map_df[map_df$region == "koroska"]$long <- 15.1
    +map_df[map_df$region == "koroska"]$lat <- 46.5
    +
    +map_df[map_df$region == "podravska"]$long <- 15.7
    +map_df[map_df$region == "podravska"]$lat <- 46.45
    +
    +map_df[map_df$region == "pomurska"]$long <- 16.2
    +map_df[map_df$region == "pomurska"]$lat <- 46.65
    +
    +map_df[map_df$region == "JV Slovenija"]$long <- 15.
    +map_df[map_df$region == "JV Slovenija"]$lat <- 45.7
    +
    +map_df$ci_size <- (map_df$high - map_df$low)
    +map_df$ci_y <- map_df$lat - 0.05
    +map_df$ci_label <- sprintf("(%.2f, %.2f)", map_df$low, map_df$high)
    +map_df$avg_label <- sprintf("%.2f", map_df$average_concentration)
    +
    +country_plot <- ggplot() +
    +    # First layer: worldwide map
    +    geom_polygon(data = map_data("world"),
    +                 aes(x=long, y=lat, group = group),
    +                 color = '#9c9c9c', fill = '#f3f3f3') +
    +    # Second layer: Country map
    +    geom_polygon(
    +        data = map_data_slo,
    +        aes(x=long, y=lat, group = group),
    +        color='darkgreen', 
    +        fill='green', 
    +        alpha=0.2
    +    ) +
    +    geom_point(data=map_df, aes(x=long, y=lat, fill=region, size=average_concentration, alpha=ci_size), color="black", pch=21) +
    +    geom_text(data=map_df, aes(x=long, y=ci_y, label=ci_label), size=3) +
    +    geom_text(data=map_df, aes(x=long, y=lat, label=avg_label), size=3) +
    +    scale_size_continuous(range = c(3, 12), trans = "exp") +
    +    scale_alpha_continuous(range = c(0.15, 0.75), trans = "reverse") +
    +    ggtitle("Estimated average Moustachium concentration with 95% CI") +
    +    coord_cartesian(xlim=c(13.2, 16.7), ylim=c(45.4, 47.))
    +
    +# ggsave(plot=country_plot, width=18, height=12, dpi=300, filename="country.pdf")
    +country_plot
    +

    diff --git a/docs/ml.html b/docs/ml.html index b30e532..19f47b7 100644 --- a/docs/ml.html +++ b/docs/ml.html @@ -6,7 +6,7 @@ Chapter 15 Maximum likelihood | Principles of Uncertainty – exercises - + @@ -23,7 +23,7 @@ - + @@ -332,15 +332,15 @@

    Chapter 15 Maximum likelihood

    15.1 Deriving MLE

    -

    Exercise 15.1

    +

    Exercise 15.1

    1. Derive the maximum likelihood estimator of variance for N\((\mu, \sigma^2)\).
    2. -
    3. Compare with results from 13.3. What does that say about the MLE estimator?
    4. +
    5. Compare with results from ??. What does that say about the MLE estimator?
    -

    Solution.

    +

    Solution.

    1. The mean is assumed constant, so we have the likelihood \[\begin{align} @@ -369,7 +369,7 @@
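The derivation is truncated in this diff. For reference (a standard completion, not quoted from the source), with \(\mu\) treated as known we have
\[\begin{align*}
l(\sigma^2; x) &= -\frac{n}{2}\ln(2\pi\sigma^2) - \frac{1}{2\sigma^2}\sum_{i=1}^n (x_i - \mu)^2, \\
\frac{\partial l}{\partial \sigma^2} &= -\frac{n}{2\sigma^2} + \frac{1}{2\sigma^4}\sum_{i=1}^n (x_i - \mu)^2 = 0
\quad \Longrightarrow \quad
\hat{\sigma}^2 = \frac{1}{n}\sum_{i=1}^n (x_i - \mu)^2.
\end{align*}\]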

      15.1 Deriving MLE -

      Exercise 15.2 (Multivariate normal distribution)

      +

      Exercise 15.2 (Multivariate normal distribution)

      1. Derive the maximum likelihood estimate for the mean and covariance matrix of the multivariate normal.

      2. Simulate \(n = 40\) samples from a bivariate normal distribution (choose non-trivial parameters, that is, mean \(\neq 0\) and covariance \(\neq 0\)). Compute the MLE for the sample. Overlay the data with an ellipse that is determined by the MLE and an ellipse that is determined by the chosen true parameters.

      3. @@ -379,7 +379,7 @@

        15.1 Deriving MLE
        -

        Solution. The log likelihood of the MVN distribution is +

    Solution. The log likelihood of the MVN distribution is \[\begin{align*} l(\mu, \Sigma ; x) &= -\frac{1}{2}\Big(\sum_{i=1}^n k\ln(2\pi) + \ln|\Sigma| + (x_i - \mu)^T \Sigma^{-1} (x_i - \mu)\Big) \\ &= -\frac{n}{2}\ln|\Sigma| - \frac{1}{2}\Big(\sum_{i=1}^n(x_i - \mu)^T \Sigma^{-1} (x_i - \mu)\Big) + c, @@ -408,33 +408,33 @@
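For reference (a standard completion of the truncated derivation above, not quoted from the source), setting the gradients with respect to \(\mu\) and \(\Sigma\) to zero gives
\[\begin{align*}
\hat{\mu} = \frac{1}{n}\sum_{i=1}^n x_i, \qquad
\hat{\Sigma} = \frac{1}{n}\sum_{i=1}^n (x_i - \hat{\mu})(x_i - \hat{\mu})^T,
\end{align*}\]
which is what mu_est and Sigma_est compute in the code below.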

        15.1 Deriving MLE
        set.seed(1)
        -n     <- 40
        -mu    <- c(1, -2)
        -Sigma <- matrix(data = c(2, -1.6, -1.6, 1.8), ncol = 2)
        -X     <- mvrnorm(n = n, mu = mu, Sigma = Sigma)
        -colnames(X) <- c("X1", "X2")
        -X     <- as.data.frame(X)
        -
        -# plot.new()
        -tru_ellip <- ellipse(mu, Sigma, draw = FALSE)
        -colnames(tru_ellip) <- c("X1", "X2")
        -tru_ellip <- as.data.frame(tru_ellip)
        -
        -mu_est    <- apply(X, 2, mean)
        -tmp       <- as.matrix(sweep(X, 2, mu_est))
        -Sigma_est <- (1 / n) * t(tmp) %*% tmp
        -
        -est_ellip <- ellipse(mu_est, Sigma_est, draw = FALSE)
        -colnames(est_ellip) <- c("X1", "X2")
        -est_ellip <- as.data.frame(est_ellip)
        -
        -ggplot(data = X, aes(x = X1, y = X2)) +
        -  geom_point() +
        -  geom_path(data = tru_ellip, aes(x = X1, y = X2, color = "truth")) +
        -  geom_path(data = est_ellip, aes(x = X1, y = X2, color = "estimated")) +
        -  labs(color = "type")

        -

        +
        set.seed(1)
        +n     <- 40
        +mu    <- c(1, -2)
        +Sigma <- matrix(data = c(2, -1.6, -1.6, 1.8), ncol = 2)
        +X     <- mvrnorm(n = n, mu = mu, Sigma = Sigma)
        +colnames(X) <- c("X1", "X2")
        +X     <- as.data.frame(X)
        +
        +# plot.new()
        +tru_ellip <- ellipse(mu, Sigma, draw = FALSE)
        +colnames(tru_ellip) <- c("X1", "X2")
        +tru_ellip <- as.data.frame(tru_ellip)
        +
        +mu_est    <- apply(X, 2, mean)
        +tmp       <- as.matrix(sweep(X, 2, mu_est))
        +Sigma_est <- (1 / n) * t(tmp) %*% tmp
        +
        +est_ellip <- ellipse(mu_est, Sigma_est, draw = FALSE)
        +colnames(est_ellip) <- c("X1", "X2")
        +est_ellip <- as.data.frame(est_ellip)
        +
        +ggplot(data = X, aes(x = X1, y = X2)) +
        +  geom_point() +
        +  geom_path(data = tru_ellip, aes(x = X1, y = X2, color = "truth")) +
        +  geom_path(data = est_ellip, aes(x = X1, y = X2, color = "estimated")) +
        +  labs(color = "type")
        +

    Exercise 15.3 (Logistic regression) Logistic regression is a popular discriminative model when our target variable is binary (categorical with 2 values). One way of looking at logistic regression is that it is linear regression, but instead of using the linear term as the mean of a normal RV, we use it as the mean of a Bernoulli RV. Of course, the mean of a Bernoulli is bounded on \([0,1]\), so, to avoid nonsensical values, we squeeze the linear term between 0 and 1 with the inverse logit function inv_logit\((z) = 1 / (1 + e^{-z})\). This leads to the following model: \(y_i | \beta, x_i \sim \text{Bernoulli}(\text{inv_logit}(\beta x_i))\).

    @@ -445,62 +445,62 @@

    Let \(y2\) be a response defined below. Will logistic regression work well on this dataset? Why not? How can we still use the model without changing it?

    -
    inv_log <- function (z) {
    -  return (1 / (1 + exp(-z)))
    -}
    -set.seed(1)
    -x  <- rnorm(100)
    -y  <- rbinom(100, size = 1, prob = inv_log(1.2 * x))
    -y2 <- rbinom(100, size = 1, prob = inv_log(1.2 * x + 1.4 * x^2))
    +
    inv_log <- function (z) {
    +  return (1 / (1 + exp(-z)))
    +}
    +set.seed(1)
    +x  <- rnorm(100)
    +y  <- rbinom(100, size = 1, prob = inv_log(1.2 * x))
    +y2 <- rbinom(100, size = 1, prob = inv_log(1.2 * x + 1.4 * x^2))
    -

    Solution. \[\begin{align*} +

    Solution. \[\begin{align*} l(\beta; x, y) &= \ln p(y | x, \beta) \\ &= \ln(\prod_{i=1}^n \text{inv_logit}(\beta x_i)^{y_i} (1 - \text{inv_logit}(\beta x_i))^{1 - y_i}) \\ &= \sum_{i=1}^n y_i \ln(\text{inv_logit}(\beta x_i)) + (1 - y_i) \ln(1 - \text{inv_logit}(\beta x_i)). \end{align*}\]
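Although the code below maximizes this likelihood numerically with optim, the score function has a closed form that is handy for checking gradients (a standard result, added here for reference):
\[\begin{equation*}
\frac{\partial l}{\partial \beta} = \sum_{i=1}^n \big(y_i - \text{inv\_logit}(\beta x_i)\big) x_i.
\end{equation*}\]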

    -
    set.seed(1)
    -inv_log <- function (z) {
    -  return (1 / (1 + exp(-z)))
    -}
    -
    -x <- rnorm(100)
    -y <- x
    -y <- rbinom(100, size = 1, prob = inv_log(1.2 * x))
    -
    -l_logistic <- function (beta, X, y) {
    -  logl <- -sum(y * log(inv_log(as.vector(beta %*% X))) + (1 - y) * log((1 - inv_log(as.vector(beta %*% X)))))
    -  return(logl)
    -}
    -
    -my_optim <- optim(par = 0.5, fn = l_logistic, method = "L-BFGS-B",
    -                  lower = 0, upper = 10, X = x, y = y)
    -my_optim$par
    +
    set.seed(1)
    +inv_log <- function (z) {
    +  return (1 / (1 + exp(-z)))
    +}
    +
    +x <- rnorm(100)
    +y <- x
    +y <- rbinom(100, size = 1, prob = inv_log(1.2 * x))
    +
    +l_logistic <- function (beta, X, y) {
    +  logl <- -sum(y * log(inv_log(as.vector(beta %*% X))) + (1 - y) * log((1 - inv_log(as.vector(beta %*% X)))))
    +  return(logl)
    +}
    +
    +my_optim <- optim(par = 0.5, fn = l_logistic, method = "L-BFGS-B",
    +                  lower = 0, upper = 10, X = x, y = y)
    +my_optim$par
    ## [1] 1.166558
    -
    truth_p <- data.frame(x = x, prob = inv_log(1.2 * x), type = "truth")
    -est_p   <- data.frame(x = x, prob = inv_log(my_optim$par * x), type = "estimated")
    -plot_df <- rbind(truth_p, est_p)
    -ggplot(data = plot_df, aes(x = x, y = prob, color = type)) +
    -  geom_point(alpha = 0.3)
    -

    -
    y2 <- rbinom(2000, size = 1, prob = inv_log(1.2 * x + 1.4 * x^2))
    -X2 <- cbind(x, x^2)
    -my_optim2 <- optim(par = c(0, 0), fn = l_logistic, method = "L-BFGS-B",
    -                   lower = c(0, 0), upper = c(2, 2), X = t(X2), y = y2)
    -my_optim2$par
    +
    truth_p <- data.frame(x = x, prob = inv_log(1.2 * x), type = "truth")
    +est_p   <- data.frame(x = x, prob = inv_log(my_optim$par * x), type = "estimated")
    +plot_df <- rbind(truth_p, est_p)
    +ggplot(data = plot_df, aes(x = x, y = prob, color = type)) +
    +  geom_point(alpha = 0.3)
    +

    +
    y2 <- rbinom(2000, size = 1, prob = inv_log(1.2 * x + 1.4 * x^2))
    +X2 <- cbind(x, x^2)
    +my_optim2 <- optim(par = c(0, 0), fn = l_logistic, method = "L-BFGS-B",
    +                   lower = c(0, 0), upper = c(2, 2), X = t(X2), y = y2)
    +my_optim2$par
    ## [1] 1.153656 1.257649
    -
    tmp     <- sweep(data.frame(x = x, x2 = x^2), 2, my_optim2$par, FUN = "*")
    -tmp     <- tmp[ ,1] + tmp[ ,2]
    -truth_p <- data.frame(x = x, prob = inv_log(1.2 * x + 1.4 * x^2), type = "truth")
    -est_p   <- data.frame(x = x, prob = inv_log(tmp), type = "estimated")
    -plot_df <- rbind(truth_p, est_p)
    -ggplot(data = plot_df, aes(x = x, y = prob, color = type)) +
    -  geom_point(alpha = 0.3)
    -

    +
    tmp     <- sweep(data.frame(x = x, x2 = x^2), 2, my_optim2$par, FUN = "*")
    +tmp     <- tmp[ ,1] + tmp[ ,2]
    +truth_p <- data.frame(x = x, prob = inv_log(1.2 * x + 1.4 * x^2), type = "truth")
    +est_p   <- data.frame(x = x, prob = inv_log(tmp), type = "estimated")
    +plot_df <- rbind(truth_p, est_p)
    +ggplot(data = plot_df, aes(x = x, y = prob, color = type)) +
    +  geom_point(alpha = 0.3)
    +

    -

    Exercise 15.4 (Linear regression) For the data generated below, do the following:

    +

    Exercise 15.4 (Linear regression) For the data generated below, do the following:

    1. Compute the least squares (MLE) estimate of coefficients beta using the matrix exact solution.
    2. Compute the MLE by minimizing the sum of squared residuals using black-box optimization (optim()).
    3. @@ -509,37 +509,37 @@

    Compute 95% CI on the beta coefficients by using (a) or (b) and the bootstrap with the percentile method for the CI. Compare with (d).

    -
    set.seed(1)
    -n <- 100
    -x1 <- rnorm(n)
    -x2 <- rnorm(n)
    -x3 <- rnorm(n)
    -
    -X <- cbind(x1, x2, x3)
    -beta <- c(0.2, 0.6, -1.2)
    -
    -y <- as.vector(t(beta %*% t(X))) + rnorm(n, sd = 0.2)
    +
    set.seed(1)
    +n <- 100
    +x1 <- rnorm(n)
    +x2 <- rnorm(n)
    +x3 <- rnorm(n)
    +
    +X <- cbind(x1, x2, x3)
    +beta <- c(0.2, 0.6, -1.2)
    +
    +y <- as.vector(t(beta %*% t(X))) + rnorm(n, sd = 0.2)
    -
    set.seed(1)
    -n <- 100
    -x1 <- rnorm(n)
    -x2 <- rnorm(n)
    -x3 <- rnorm(n)
    -
    -X <- cbind(x1, x2, x3)
    -beta <- c(0.2, 0.6, -1.2)
    -
    -y <- as.vector(t(beta %*% t(X))) + rnorm(n, sd = 0.2)
    -LS_fun <- function (beta, X, y) {
    -  return(sum((y - beta %*% t(X))^2))
    -}
    -my_optim <- optim(par = c(0, 0, 0), fn = LS_fun, lower = -5, upper = 5,
    -                  X = X, y = y, method = "L-BFGS-B")
    -my_optim$par
    +
    set.seed(1)
    +n <- 100
    +x1 <- rnorm(n)
    +x2 <- rnorm(n)
    +x3 <- rnorm(n)
    +
    +X <- cbind(x1, x2, x3)
    +beta <- c(0.2, 0.6, -1.2)
    +
    +y <- as.vector(t(beta %*% t(X))) + rnorm(n, sd = 0.2)
    +LS_fun <- function (beta, X, y) {
    +  return(sum((y - beta %*% t(X))^2))
    +}
    +my_optim <- optim(par = c(0, 0, 0), fn = LS_fun, lower = -5, upper = 5,
    +                  X = X, y = y, method = "L-BFGS-B")
    +my_optim$par
    ## [1]  0.1898162  0.5885946 -1.1788264
    -
    df <- data.frame(y = y, x1 = x1, x2 = x2, x3 = x3)
    -my_lm <- lm(y ~ x1 + x2 + x3 - 1, data = df)
    -my_lm
    +
    df <- data.frame(y = y, x1 = x1, x2 = x2, x3 = x3)
    +my_lm <- lm(y ~ x1 + x2 + x3 - 1, data = df)
    +my_lm
    ## 
     ## Call:
     ## lm(formula = y ~ x1 + x2 + x3 - 1, data = df)
    @@ -547,41 +547,41 @@ 

    15.1 Deriving MLE
    # matrix solution
    -beta_hat <- solve(t(X) %*% X) %*% t(X) %*% y
    -beta_hat

    +
    # matrix solution
    +beta_hat <- solve(t(X) %*% X) %*% t(X) %*% y
    +beta_hat
    ##          [,1]
     ## x1  0.1898162
     ## x2  0.5885946
     ## x3 -1.1788264
    -
    out <- summary(my_lm)
    -out$coefficients[ ,2]
    +
    out <- summary(my_lm)
    +out$coefficients[ ,2]
    ##         x1         x2         x3 
     ## 0.02209328 0.02087542 0.01934506
    -
    # bootstrap CI
    -nboot <- 1000
    -beta_boot <- matrix(data = NA, ncol = length(beta), nrow = nboot)
    -for (i in 1:nboot) {
    -  inds     <- sample(1:n, n, replace = T)
    -  new_df   <- df[inds, ]
    -  X_tmp    <- as.matrix(new_df[ ,-1])
    -  y_tmp    <- new_df[ ,1]
    -  # print(nrow(new_df))
    -  tmp_beta <- solve(t(X_tmp) %*% X_tmp) %*% t(X_tmp) %*% y_tmp
    -  beta_boot[i, ] <- tmp_beta
    -}
    -apply(beta_boot, 2, mean)
    +
    # bootstrap CI
    +nboot <- 1000
    +beta_boot <- matrix(data = NA, ncol = length(beta), nrow = nboot)
    +for (i in 1:nboot) {
    +  inds     <- sample(1:n, n, replace = T)
    +  new_df   <- df[inds, ]
    +  X_tmp    <- as.matrix(new_df[ ,-1])
    +  y_tmp    <- new_df[ ,1]
    +  # print(nrow(new_df))
    +  tmp_beta <- solve(t(X_tmp) %*% X_tmp) %*% t(X_tmp) %*% y_tmp
    +  beta_boot[i, ] <- tmp_beta
    +}
    +apply(beta_boot, 2, mean)
    ## [1]  0.1893281  0.5887068 -1.1800738
    -
    apply(beta_boot, 2, quantile, probs = c(0.025, 0.975))
    +
    apply(beta_boot, 2, quantile, probs = c(0.025, 0.975))
    ##            [,1]      [,2]      [,3]
     ## 2.5%  0.1389441 0.5436911 -1.221560
     ## 97.5% 0.2386295 0.6363102 -1.140416
    -
    out$coefficients[ ,2]
    +
    out$coefficients[ ,2]
    ##         x1         x2         x3 
     ## 0.02209328 0.02087542 0.01934506
    -

    Exercise 15.5 (Principal component analysis) Load the olympic data set from package ade4. The data show decathlon results for 33 men in the 1988 Olympic Games. This data set serves as a great example of finding the latent structure in the data, as there are certain characteristics of the athletes that make them excel at different events. For example, an explosive athlete will do particularly well in sprints and long jumps.

    +

    Exercise 15.5 (Principal component analysis) Load the olympic data set from package ade4. The data show decathlon results for 33 men in the 1988 Olympic Games. This data set serves as a great example of finding the latent structure in the data, as there are certain characteristics of the athletes that make them excel at different events. For example, an explosive athlete will do particularly well in sprints and long jumps.

    1. Perform PCA (prcomp) on the data set and interpret the first 2 latent dimensions. Hint: Standardize the data first to get meaningful results.

    2. Use MLE to estimate the covariance of the standardized multivariate distribution.

    3. @@ -589,12 +589,12 @@

      15.1 Deriving MLE -
      data(olympic)
      -
      -X        <- olympic$tab
      -X_scaled <- scale(X)
      -my_pca   <- prcomp(X_scaled)
      -summary(my_pca)
      +
      data(olympic)
      +
      +X        <- olympic$tab
      +X_scaled <- scale(X)
      +my_pca   <- prcomp(X_scaled)
      +summary(my_pca)
      ## Importance of components:
       ##                           PC1    PC2     PC3    PC4     PC5     PC6     PC7
       ## Standard deviation     1.8488 1.6144 0.97123 0.9370 0.74607 0.70088 0.65620
      @@ -604,47 +604,47 @@ 

      15.1 Deriving MLE
      autoplot(my_pca, data = X, loadings = TRUE, loadings.colour = 'blue',
      -         loadings.label = TRUE, loadings.label.size = 3)

    -

    -
    Sigma_est <- (1 / nrow(X_scaled)) * t(X_scaled) %*% X_scaled
    -Sigma_dec <- eigen(Sigma_est)
    -
    -Sigma_dec$vectors
    +
    autoplot(my_pca, data = X, loadings = TRUE, loadings.colour = 'blue',
    +         loadings.label = TRUE, loadings.label.size = 3)
    +

    +
    Sigma_est <- (1 / nrow(X_scaled)) * t(X_scaled) %*% X_scaled
    +Sigma_dec <- eigen(Sigma_est)
    +
    +Sigma_dec$vectors
    ##             [,1]       [,2]        [,3]        [,4]         [,5]        [,6]
    -##  [1,]  0.4158823  0.1488081 -0.26747198 -0.08833244 -0.442314456  0.03071237
    -##  [2,] -0.3940515 -0.1520815 -0.16894945 -0.24424963  0.368913901 -0.09378242
    -##  [3,] -0.2691057  0.4835374  0.09853273 -0.10776276 -0.009754680  0.23002054
    -##  [4,] -0.2122818  0.0278985 -0.85498656  0.38794393 -0.001876311  0.07454380
    -##  [5,]  0.3558474  0.3521598 -0.18949642  0.08057457  0.146965351 -0.32692886
    -##  [6,]  0.4334816  0.0695682 -0.12616012 -0.38229029 -0.088802794  0.21049130
    -##  [7,] -0.1757923  0.5033347  0.04609969  0.02558404  0.019358607  0.61491241
    -##  [8,] -0.3840821  0.1495820  0.13687235  0.14396548 -0.716743474 -0.34776037
    -##  [9,] -0.1799436  0.3719570 -0.19232803 -0.60046566  0.095582043 -0.43744387
    -## [10,]  0.1701426  0.4209653  0.22255233  0.48564231  0.339772188 -0.30032419
    +##  [1,]  0.4158823  0.1488081 -0.26747198  0.08833244 -0.442314456  0.03071237
    +##  [2,] -0.3940515 -0.1520815 -0.16894945  0.24424963  0.368913901 -0.09378242
    +##  [3,] -0.2691057  0.4835374  0.09853273  0.10776276 -0.009754680  0.23002054
    +##  [4,] -0.2122818  0.0278985 -0.85498656 -0.38794393 -0.001876311  0.07454380
    +##  [5,]  0.3558474  0.3521598 -0.18949642 -0.08057457  0.146965351 -0.32692886
    +##  [6,]  0.4334816  0.0695682 -0.12616012  0.38229029 -0.088802794  0.21049130
    +##  [7,] -0.1757923  0.5033347  0.04609969 -0.02558404  0.019358607  0.61491241
    +##  [8,] -0.3840821  0.1495820  0.13687235 -0.14396548 -0.716743474 -0.34776037
    +##  [9,] -0.1799436  0.3719570 -0.19232803  0.60046566  0.095582043 -0.43744387
    +## [10,]  0.1701426  0.4209653  0.22255233 -0.48564231  0.339772188 -0.30032419
     ##             [,7]         [,8]        [,9]       [,10]
    -##  [1,]  0.2543985  0.663712826 -0.10839531  0.10948045
    -##  [2,]  0.7505343  0.141264141  0.04613910  0.05580431
    -##  [3,] -0.1106637  0.072505560  0.42247611  0.65073655
    -##  [4,] -0.1351242 -0.155435871 -0.10206505  0.11941181
    -##  [5,]  0.1413388 -0.146839303  0.65076229 -0.33681395
    -##  [6,]  0.2725296 -0.639003579 -0.20723854  0.25971800
    -##  [7,]  0.1439726  0.009400445 -0.16724055 -0.53450315
    -##  [8,]  0.2732665 -0.276873049 -0.01766443 -0.06589572
    -##  [9,] -0.3419099  0.058519366 -0.30619617 -0.13093187
    -## [10,]  0.1868704  0.007310045 -0.45688227  0.24311846
    -
    my_pca$rotation
    +##  [1,]  0.2543985  0.663712826 -0.10839531 -0.10948045
    +##  [2,]  0.7505343  0.141264141  0.04613910 -0.05580431
    +##  [3,] -0.1106637  0.072505560  0.42247611 -0.65073655
    +##  [4,] -0.1351242 -0.155435871 -0.10206505 -0.11941181
    +##  [5,]  0.1413388 -0.146839303  0.65076229  0.33681395
    +##  [6,]  0.2725296 -0.639003579 -0.20723854 -0.25971800
    +##  [7,]  0.1439726  0.009400445 -0.16724055  0.53450315
    +##  [8,]  0.2732665 -0.276873049 -0.01766443  0.06589572
    +##  [9,] -0.3419099  0.058519366 -0.30619617  0.13093187
    +## [10,]  0.1868704  0.007310045 -0.45688227 -0.24311846
    +
    my_pca$rotation
    ##             PC1        PC2         PC3         PC4          PC5         PC6
    -## 100  -0.4158823  0.1488081  0.26747198 -0.08833244 -0.442314456  0.03071237
    -## long  0.3940515 -0.1520815  0.16894945 -0.24424963  0.368913901 -0.09378242
    -## poid  0.2691057  0.4835374 -0.09853273 -0.10776276 -0.009754680  0.23002054
    -## haut  0.2122818  0.0278985  0.85498656  0.38794393 -0.001876311  0.07454380
    -## 400  -0.3558474  0.3521598  0.18949642  0.08057457  0.146965351 -0.32692886
    -## 110  -0.4334816  0.0695682  0.12616012 -0.38229029 -0.088802794  0.21049130
    -## disq  0.1757923  0.5033347 -0.04609969  0.02558404  0.019358607  0.61491241
    -## perc  0.3840821  0.1495820 -0.13687235  0.14396548 -0.716743474 -0.34776037
    -## jave  0.1799436  0.3719570  0.19232803 -0.60046566  0.095582043 -0.43744387
    -## 1500 -0.1701426  0.4209653 -0.22255233  0.48564231  0.339772188 -0.30032419
    +## 100  -0.4158823  0.1488081 -0.26747198  0.08833244 -0.442314456  0.03071237
    +## long  0.3940515 -0.1520815 -0.16894945  0.24424963  0.368913901 -0.09378242
    +## poid  0.2691057  0.4835374  0.09853273  0.10776276 -0.009754680  0.23002054
    +## haut  0.2122818  0.0278985 -0.85498656 -0.38794393 -0.001876311  0.07454380
    +## 400  -0.3558474  0.3521598 -0.18949642 -0.08057457  0.146965351 -0.32692886
    +## 110  -0.4334816  0.0695682 -0.12616012  0.38229029 -0.088802794  0.21049130
    +## disq  0.1757923  0.5033347  0.04609969 -0.02558404  0.019358607  0.61491241
    +## perc  0.3840821  0.1495820  0.13687235 -0.14396548 -0.716743474 -0.34776037
    +## jave  0.1799436  0.3719570 -0.19232803  0.60046566  0.095582043 -0.43744387
    +## 1500 -0.1701426  0.4209653  0.22255233 -0.48564231  0.339772188 -0.30032419
     ##             PC7          PC8         PC9        PC10
     ## 100   0.2543985 -0.663712826  0.10839531 -0.10948045
     ## long  0.7505343 -0.141264141 -0.04613910 -0.05580431
    @@ -657,11 +657,151 @@ 

    15.1 Deriving MLE +

    Exercise 15.6 (Classification) Let \(D = \{(x_i, y_i)\}_{i=1}^n\) be a dataset of feature vectors and their corresponding integer class labels. We wish to classify feature vectors into correct classes.

    +
      +
    1. Choose a suitable probability distribution \(P_\theta(Y|X)\) and write its log likelihood \(\ell\).
    2. +
    3. Choose a differentiable function \(f_\phi\) that predicts parameters \(\theta\) from a feature vector, i.e. \(f_\phi(x_i) = \theta_i\).
    4. +
    5. Load the iris dataset with data(iris) and split it into train and test subsets.
    6. +
    7. Use gradient descent to find parameters \(\phi\) that minimize the negative log likelihood on the iris dataset (equivalently: maximize the log likelihood). Reminder: gradient descent is an iterative optimization procedure \(\phi_{t+1} = \phi_t - \eta \nabla_\phi \ell\). Try \(\eta = 0.01\) and run optimization for 30 steps. Compute the gradient with numDeriv::grad.
    8. +
    9. Print the classification accuracy for the train and test subsets.
    10. +
    + +
    +
    +

    Solution.

    +
      +
    1. We pick the categorical distribution.
    2. +
    3. Categorical distribution parameters are class probabilities that sum to 1. If there are \(m\) classes, we can pick any differentiable function that takes as input a vector of features and predicts a vector of size \(m\) whose elements are real numbers. We can then use a softmax transformation to map the predicted vector into one with non-negative entries that sum to 1. For simplicity, we can pick a linear transformation with \(\phi = (W, b)\), followed by softmax: +\[\begin{align*} +f_\phi(x) &= \textrm{softmax}(Wx + b), \\ +\textrm{softmax}(u)_i &= \frac{\exp(u_i)}{\sum_{j=1}^m \exp(u_j)}, + \end{align*}\] +where \(W \in \mathbb{R}^{m\times d}, b \in \mathbb{R}^m\) and \(d\) is the number of features.
    4. +
    +
    +
    data(iris)
    +head(iris)
    +
    ##   Sepal.Length Sepal.Width Petal.Length Petal.Width Species
    +## 1          5.1         3.5          1.4         0.2  setosa
    +## 2          4.9         3.0          1.4         0.2  setosa
    +## 3          4.7         3.2          1.3         0.2  setosa
    +## 4          4.6         3.1          1.5         0.2  setosa
    +## 5          5.0         3.6          1.4         0.2  setosa
    +## 6          5.4         3.9          1.7         0.4  setosa
    +
    # Model:
    +# y ~ Categorical(softmax(weights * features + bias))
    +# Want to maximize the (log) likelihood of y w.r.t. weights and bias.
    +# Need gradient of log likelihood w.r.t. weights and bias.
    +# Proceed by gradient descent on negative log likelihood.
    +
    +weights <- matrix(data=rnorm(4 * 3), nrow=4, ncol=3)
    +bias <- matrix(data=rnorm(3), nrow=1, ncol=3)
    +
    +model <- function(features, weights, bias) {
    +  # weights: 4 x 3 matrix of per-class coefficients, bias: length-3 vector (or 1 x 3 matrix).
    +  # Returns a 3 x n matrix of linear scores (classes in rows, observations in columns).
    +  return(t(features %*% weights + bias))
    +}
    +
    +softmax <- function(v) {
    +  return(exp(v) / sum(exp(v)))
    +}
    +
    +categorical_mass <- function(targets, probs) {
    +  # targets: matrix of size (n_data, n_classes) whose rows are one-hot vectors
    +  # probs: matrix of size (n_data, n_classes) whose rows are class probabilities
    +  apply(probs * targets, 1, sum)
    +}
    +
    +predict_probs <- function(features, model, parameters) {
    +  weights <- parameters[1:4, ]
    +  bias <- parameters[5, ]
    +  u <- model(features, weights, bias)
    +  apply(u, 1, softmax)
    +}
    +
    +accuracy <- function(features, targets, model, parameters) {
    +  probs <- predict_probs(features, model, parameters)
    +  argmax_mat <- t(apply(probs, 1, function(v) {v == max(v)}))
    +  correct_predictions <- apply(argmax_mat * targets, 1, sum)
    +  return(mean(correct_predictions))
    +}
    +
    +neg_log_lik <- function(features, targets, model, parameters) {
    +  probs <- predict_probs(features, model, parameters)
    +  -sum(log(categorical_mass(targets, probs)))
    +}
    +
    +grad_neg_log_lik <- function(features, targets, model, parameters){
    +  numDeriv::grad(function(par){neg_log_lik(features, targets, model, par)}, parameters)
    +}
    +
    +gradient_descent <- function(initial_parameters, features, targets, step_size = 0.01, n_steps = 30) {
    +  parameters <- initial_parameters
    +  for (i in 1:n_steps) {
    +    print(sprintf("[%d] loss: %.4f, accuracy: %.2f", i, neg_log_lik(features, targets, model, parameters), accuracy(features, targets, model, parameters)))
    +    parameters <- parameters - step_size * grad_neg_log_lik(features, targets, model, parameters)
    +  }
    +  return(parameters)
    +}
    +
    +
    +x <- as.matrix(subset(iris, select=-c(Species)))
    +y <- matrix(nrow=nrow(iris), ncol=3)
    +y[, 1] <- iris$Species == "setosa"
    +y[, 2] <- iris$Species == "versicolor"
    +y[, 3] <- iris$Species == "virginica"
    +
    +# Take an equal number of representatives for every class for the training and test subsets
    +# Note: code is written so that shuffling does not matter during optimization
    +x_train <- x[c(1:35, 51:85, 101:135), ]
    +y_train <- y[c(1:35, 51:85, 101:135), ]
    +
    +x_test <- x[-c(1:35, 51:85, 101:135), ]
    +y_test <- y[-c(1:35, 51:85, 101:135), ]
    +
    +set.seed(0)
    +optimized_parameters <- gradient_descent(rbind(weights, bias), x_train, y_train)
    +
    ## [1] "[1] loss: 687.3208, accuracy: 0.02"
    +## [1] "[2] loss: 452.4356, accuracy: 0.66"
    +## [1] "[3] loss: 429.3215, accuracy: 0.92"
    +## [1] "[4] loss: 427.2969, accuracy: 0.93"
    +## [1] "[5] loss: 425.9729, accuracy: 0.93"
    +## [1] "[6] loss: 424.9825, accuracy: 0.95"
    +## [1] "[7] loss: 424.1846, accuracy: 0.95"
    +## [1] "[8] loss: 423.5169, accuracy: 0.95"
    +## [1] "[9] loss: 422.9466, accuracy: 0.95"
    +## [1] "[10] loss: 422.4535, accuracy: 0.94"
    +## [1] "[11] loss: 422.0234, accuracy: 0.94"
    +## [1] "[12] loss: 421.6456, accuracy: 0.93"
    +## [1] "[13] loss: 421.3116, accuracy: 0.92"
    +## [1] "[14] loss: 421.0144, accuracy: 0.92"
    +## [1] "[15] loss: 420.7485, accuracy: 0.92"
    +## [1] "[16] loss: 420.5091, accuracy: 0.92"
    +## [1] "[17] loss: 420.2926, accuracy: 0.92"
    +## [1] "[18] loss: 420.0955, accuracy: 0.92"
    +## [1] "[19] loss: 419.9153, accuracy: 0.92"
    +## [1] "[20] loss: 419.7498, accuracy: 0.92"
    +## [1] "[21] loss: 419.5969, accuracy: 0.92"
    +## [1] "[22] loss: 419.4552, accuracy: 0.92"
    +## [1] "[23] loss: 419.3233, accuracy: 0.92"
    +## [1] "[24] loss: 419.2000, accuracy: 0.92"
    +## [1] "[25] loss: 419.0843, accuracy: 0.92"
    +## [1] "[26] loss: 418.9755, accuracy: 0.92"
    +## [1] "[27] loss: 418.8727, accuracy: 0.92"
    +## [1] "[28] loss: 418.7754, accuracy: 0.92"
    +## [1] "[29] loss: 418.6831, accuracy: 0.92"
    +## [1] "[30] loss: 418.5952, accuracy: 0.92"
    +
    accuracy(x_train, y_train, model, optimized_parameters)
    +
    ## [1] 0.9238095
    +
    accuracy(x_test, y_test, model, optimized_parameters)
    +
    ## [1] 0.9555556
    +

    15.2 Fisher information

    -

    Exercise 15.6 Let us assume a Poisson likelihood.

    +

    Exercise 15.7 Let us assume a Poisson likelihood.

    1. Derive the MLE estimate of the mean.

    2. Derive the Fisher information.

    3. @@ -669,10 +809,10 @@

    Use the bootstrap to construct the CI for the mean. Compare with c) and discuss.

    -
    x <- c(2, 5, 3, 1, 2, 1, 0, 3, 0, 2)
    +
    x <- c(2, 5, 3, 1, 2, 1, 0, 3, 0, 2)
    -

    Solution.

    +

    Solution.

    1. The log likelihood of the Poisson is \[\begin{align*} @@ -696,28 +836,28 @@
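The derivation is truncated here; for reference (consistent with the code below, though not quoted from the source), the standard results are
\[\begin{align*}
l(\lambda; x) &= \sum_{i=1}^n \big(x_i \ln\lambda - \lambda - \ln x_i!\big), \qquad
\hat{\lambda} = \bar{x}, \qquad
I(\lambda) = \frac{n}{\lambda},
\end{align*}\]
where \(I(\lambda)\) is the Fisher information of the whole sample, which is why the code uses finfo <- length(x) / lambda_hat and the asymptotic CI \(\hat{\lambda} \pm 1.96 \sqrt{1 / I(\hat{\lambda})}\).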

      15.2 Fisher information
      set.seed(1)
      -x          <- c(2, 5, 3, 1, 2, 1, 0, 3, 0, 2)
      -lambda_hat <- mean(x)
      -finfo      <- length(x) / lambda_hat
      -mle_CI     <- c(lambda_hat - 1.96 * sqrt(1 / finfo),
      -                lambda_hat + 1.96 * sqrt(1 / finfo))
      -boot_lambda <- c()
      -nboot       <- 1000
      -for (i in 1:nboot) {
      -  tmp_x          <- sample(x, length(x), replace = T)
      -  boot_lambda[i] <- mean(tmp_x)
      -}
      -boot_CI <- c(quantile(boot_lambda, 0.025),
      -             quantile(boot_lambda, 0.975))
      -mle_CI

    +
    set.seed(1)
    +x          <- c(2, 5, 3, 1, 2, 1, 0, 3, 0, 2)
    +lambda_hat <- mean(x)
    +finfo      <- length(x) / lambda_hat
    +mle_CI     <- c(lambda_hat - 1.96 * sqrt(1 / finfo),
    +                lambda_hat + 1.96 * sqrt(1 / finfo))
    +boot_lambda <- c()
    +nboot       <- 1000
    +for (i in 1:nboot) {
    +  tmp_x          <- sample(x, length(x), replace = T)
    +  boot_lambda[i] <- mean(tmp_x)
    +}
    +boot_CI <- c(quantile(boot_lambda, 0.025),
    +             quantile(boot_lambda, 0.975))
    +mle_CI
    ## [1] 1.045656 2.754344
    -
    boot_CI
    +
    boot_CI
    ##  2.5% 97.5% 
     ##   1.0   2.7
    -

    Exercise 15.7

    +

    Exercise 15.8

    1. Find the Fisher information matrix for the Gamma distribution.

    2. Generate 20 samples from a Gamma distribution and plot a confidence ellipse of the inverse of Fisher information matrix around the ML estimates of the parameters. Also plot the theoretical values. Repeat the sampling several times. What do you observe?

    3. @@ -727,7 +867,7 @@

      15.2 Fisher information
      -

      Solution.

      +

      Solution.

      1. The log likelihood of the Gamma is \[\begin{equation*} @@ -761,50 +901,113 @@
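The derivation is truncated in this diff; for reference (consistent with fish_mat constructed in the code below, not quoted from the source), the log likelihood and the Fisher information matrix of the sample are
\[\begin{align*}
l(\alpha, \beta; x) &= n\alpha\ln\beta - n\ln\Gamma(\alpha) + (\alpha - 1)\sum_{i=1}^n \ln x_i - \beta\sum_{i=1}^n x_i, \\
I(\alpha, \beta) &= n\begin{bmatrix} \psi_1(\alpha) & -\frac{1}{\beta} \\ -\frac{1}{\beta} & \frac{\alpha}{\beta^2} \end{bmatrix},
\end{align*}\]
where \(\psi_1\) is the trigamma function (obtained numerically in the code as grad(digamma, pars_mle[1])).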

        15.2 Fisher information
        set.seed(1)
        -n  <- 20
        -pars_theor <- c(5, 2)
        -x  <- rgamma(n, 5, 2)
        -
        -
        -# MLE for alpha and beta
        -log_lik <- function (pars, x) {
        -  n <- length(x)
        -  return (- (n * pars[1] * log(pars[2]) -
        -             n * log(gamma(pars[1])) +
        -             (pars[1] - 1) * sum(log(x)) -
        -             pars[2] * sum(x)))
        -}
        -my_optim <- optim(par = c(1,1), fn = log_lik, method = "L-BFGS-B",
        -                  lower = c(0.001, 0.001), upper = c(8, 8), x = x)
        -pars_mle <- my_optim$par
        -
        -fish_mat <- matrix(data = NA, nrow = 2, ncol = 2)
        -fish_mat[1,2] <- - n / pars_mle[2]
        -fish_mat[2,1] <- - n / pars_mle[2]
        -fish_mat[2,2] <- (n * pars_mle[1]) / (pars_mle[2]^2)
        -fish_mat[1,1] <- n * grad(digamma, pars_mle[1])
        -
        -fish_mat_inv <- solve(fish_mat)
        -
        -est_ellip <- ellipse(pars_mle, fish_mat_inv, draw = FALSE)
        -colnames(est_ellip) <- c("X1", "X2")
        -est_ellip <- as.data.frame(est_ellip)
        -
        -ggplot() +
        -  geom_point(data = data.frame(x = pars_mle[1], y = pars_mle[2]), aes(x = x, y = y)) +
        -  geom_path(data = est_ellip, aes(x = X1, y = X2)) +
        -  geom_point(aes(x = pars_theor[1], y = pars_theor[2]), color = "red") +
        -  geom_text(aes(x = pars_theor[1], y = pars_theor[2], label = "Theoretical parameters"), 
        -            color = "red",
        -            nudge_y = -0.2)

      -

      +
      set.seed(1)
      +n  <- 20
      +pars_theor <- c(5, 2)
      +x  <- rgamma(n, 5, 2)
      +
      +
      +# MLE for alpha and beta
      +log_lik <- function (pars, x) {
      +  n <- length(x)
      +  return (- (n * pars[1] * log(pars[2]) -
      +             n * log(gamma(pars[1])) +
      +             (pars[1] - 1) * sum(log(x)) -
      +             pars[2] * sum(x)))
      +}
      +my_optim <- optim(par = c(1,1), fn = log_lik, method = "L-BFGS-B",
      +                  lower = c(0.001, 0.001), upper = c(8, 8), x = x)
      +pars_mle <- my_optim$par
      +
      +fish_mat <- matrix(data = NA, nrow = 2, ncol = 2)
      +fish_mat[1,2] <- - n / pars_mle[2]
      +fish_mat[2,1] <- - n / pars_mle[2]
      +fish_mat[2,2] <- (n * pars_mle[1]) / (pars_mle[2]^2)
      +fish_mat[1,1] <- n * grad(digamma, pars_mle[1])
      +
      +fish_mat_inv <- solve(fish_mat)
      +
      +est_ellip <- ellipse(pars_mle, fish_mat_inv, draw = FALSE)
      +colnames(est_ellip) <- c("X1", "X2")
      +est_ellip <- as.data.frame(est_ellip)
      +
      +ggplot() +
      +  geom_point(data = data.frame(x = pars_mle[1], y = pars_mle[2]), aes(x = x, y = y)) +
      +  geom_path(data = est_ellip, aes(x = X1, y = X2)) +
      +  geom_point(aes(x = pars_theor[1], y = pars_theor[2]), color = "red") +
      +  geom_text(aes(x = pars_theor[1], y = pars_theor[2], label = "Theoretical parameters"), 
      +            color = "red",
      +            nudge_y = -0.2)
      +

      +

    +
    +

    Exercise 15.9 Find the unit Fisher information matrix for the univariate normal distribution.

    +
    +
    +
    +

    Solution. The normal density is +\[\begin{equation*} + p(x; \mu, \sigma) = \frac{1}{\sqrt{2\pi \sigma^2}} \exp\left(-0.5 \frac{(x-\mu)^2}{\sigma^2}\right). +\end{equation*}\]

    +

    Its logarithm is +\[\begin{equation*} + \log p(x; \mu, \sigma) = -0.5\log(2\pi) - \log \sigma - 0.5 \frac{(x-\mu)^2}{\sigma^2}. +\end{equation*}\]

    +

    The second order partial derivatives of the log density are +\[\begin{align*} + \frac{\partial^2}{\partial \mu^2} \log p(x; \mu, \sigma) &= -\frac{1}{\sigma^2}, \\ + \frac{\partial^2}{\partial \mu \partial \sigma} \log p(x; \mu, \sigma) &= -\frac{2(x-\mu)}{\sigma^3}, \\ + \frac{\partial^2}{\partial \sigma^2} \log p(x; \mu, \sigma) &= \frac{1}{\sigma^2} - \frac{3(x-\mu)^2}{\sigma^4}. +\end{align*}\]

    +

    The unit Fisher information matrix is then +\[\begin{align*} +I(\mu, \sigma) = + - E\left[ + \begin{bmatrix} + -\frac{1}{\sigma^2} & -\frac{2(x-\mu)}{\sigma^3} \\ + -\frac{2(x-\mu)}{\sigma^3} & \frac{1}{\sigma^2} - \frac{3(x-\mu)^2}{\sigma^4} + \end{bmatrix} + \right] = + \begin{bmatrix} + \frac{1}{\sigma^2} & 0 \\ + 0 & \frac{2}{\sigma^2} + \end{bmatrix}, +\end{align*}\] +where we used the fact that \(E[X - \mu] = 0\) and \(E[(X - \mu)^2] = \sigma^2\).
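As a quick numerical sanity check (a sketch, not part of the original solution), we can average the negative Hessian of the log density over simulated data and compare it with the analytic unit Fisher information diag\((1/\sigma^2, 2/\sigma^2)\); the values of mu and sigma below are illustrative.

    # Sketch: Monte Carlo estimate of -E[Hessian of log p] vs the analytic result.
    library(numDeriv)
    set.seed(1)
    mu    <- 1
    sigma <- 2
    log_dens <- function(pars, obs) dnorm(obs, mean = pars[1], sd = pars[2], log = TRUE)
    x <- rnorm(2000, mu, sigma)
    hess_sum <- matrix(0, nrow = 2, ncol = 2)
    for (obs in x) {
      hess_sum <- hess_sum + hessian(log_dens, c(mu, sigma), obs = obs)
    }
    -hess_sum / length(x)                          # Monte Carlo estimate of I(mu, sigma)
    matrix(c(1 / sigma^2, 0, 0, 2 / sigma^2), 2)   # analytic unit Fisher information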

    +
    +
    +
    +

    Exercise 15.10 Find the unit Fisher information for the binomial distribution with fixed \(n\).

    +
    +
    +
    +

    Solution. The binomial mass is +\[\begin{equation*} + P(X = k; n, p) = \binom{n}{k}p^k(1-p)^{n-k}. +\end{equation*}\]

    +

    Its logarithm is +\[\begin{equation*} + \log P(X = k; n, p) = \log \binom{n}{k} + k\log p + (n-k)\log(1-p). +\end{equation*}\]

    +

    The partial derivatives are +\[\begin{align*} + \frac{\partial}{\partial p} \log P(X = k; n, p) &= \frac{k}{p} - \frac{n-k}{1-p}, \\ + \frac{\partial^2}{\partial p^2} \log P(X = k; n, p) &= -\frac{k}{p^2} - \frac{n-k}{(1-p)^2}. +\end{align*}\]

    +

    The unit Fisher information is +\[\begin{align*} +I(p) = + - E\left[ \frac{\partial^2}{\partial p^2} \log P(X = k; n, p) \right] = + \frac{n}{p(1-p)}, +\end{align*}\] +where we used the fact that \(E[k] = np\) for \(k \sim \text{Binomial}(n, p)\).
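A short numerical check (a sketch, not from the original solution; n and p below are illustrative) compares a Monte Carlo estimate of \(-E\left[\frac{\partial^2}{\partial p^2} \log P(X = k)\right]\) with the analytic value \(n / (p(1-p))\).

    # Sketch: Monte Carlo check of the binomial Fisher information.
    set.seed(1)
    n <- 10
    p <- 0.4
    k <- rbinom(100000, size = n, prob = p)
    mean(k / p^2 + (n - k) / (1 - p)^2)  # Monte Carlo estimate of I(p)
    n / (p * (1 - p))                    # analytic value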

    +

    15.3 The German tank problem

    -

    Exercise 15.8 (The German tank problem) During WWII, Allied intelligence faced the important problem of estimating the total production of certain German tanks, such as the Panther. An approach that turned out to be successful was to estimate the maximum from the serial numbers of a small sample of captured or destroyed tanks (describe the statistical model used).

    +

    Exercise 15.11 (The German tank problem) During WWII, Allied intelligence faced the important problem of estimating the total production of certain German tanks, such as the Panther. An approach that turned out to be successful was to estimate the maximum from the serial numbers of a small sample of captured or destroyed tanks (describe the statistical model used).

    1. What assumptions were made by using the above model? Do you think they are reasonable assumptions in practice?
    2. Show that the plug-in estimate for the maximum (i.e. the maximum of the sample) is a biased estimator.
    3. @@ -814,7 +1017,7 @@
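A small simulation sketch for point 2 (added for illustration, not from the original solution; N and k below are illustrative values), assuming serial numbers are drawn uniformly from \(1, \dots, N\) without replacement:

    # Sketch: the sample maximum underestimates the true maximum N on average,
    # so the plug-in estimator is biased.
    set.seed(1)
    N <- 1000                                     # true (unknown) maximum
    k <- 10                                       # number of captured tanks
    plugin_max <- replicate(10000, max(sample(1:N, k)))
    mean(plugin_max)                              # noticeably below N
    k * (N + 1) / (k + 1)                         # theoretical E[sample maximum]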

      15.3 The German tank problem
      -
      library(ggplot2)
      -my_fun <- function (x, m, k) {
      -  tmp        <-  1 / (choose(x, k))
      -  tmp[x < m] <- 0
      -  return (tmp)
      -}
      -x  <- 1:20
      -y  <- my_fun(x, 10, 4)
      -df <- data.frame(x = x, y = y)
      -ggplot(data = df, aes(x = x, y = y)) +
      -  geom_line()
      -

      +

      library(ggplot2)
      +my_fun <- function (x, m, k) {
      +  tmp        <-  1 / (choose(x, k))
      +  tmp[x < m] <- 0
      +  return (tmp)
      +}
      +x  <- 1:20
      +y  <- my_fun(x, 10, 4)
      +df <- data.frame(x = x, y = y)
      +ggplot(data = df, aes(x = x, y = y)) +
      +  geom_line()
      +

      ::: {.solution}

      1. (continued) We observe that the maximum of this function lies at the maximum value of the sample. Therefore \(n^* = m\) and the ML estimate equals the plug-in estimate.

      2. diff --git a/docs/reference-keys.txt b/docs/reference-keys.txt index ed6807c..04d9363 100644 --- a/docs/reference-keys.txt +++ b/docs/reference-keys.txt @@ -210,3 +210,12 @@ exr:unnamed-chunk-32 exr:unnamed-chunk-35 exr:unnamed-chunk-5 exr:unnamed-chunk-40 +exr:unnamed-chunk-10 +exr:unnamed-chunk-19 +exr:unnamed-chunk-22 +exr:unnamed-chunk-24 +exr:unnamed-chunk-26 +exr:unnamed-chunk-28 +exr:unnamed-chunk-27 +exr:unnamed-chunk-29 +exr:unnamed-chunk-12 diff --git a/docs/search_index.json b/docs/search_index.json index 479182c..6f2fbb8 100644 --- a/docs/search_index.json +++ b/docs/search_index.json @@ -1 +1 @@ -[["rvs.html", "Chapter 4 Random variables 4.1 General properties and calculations 4.2 Discrete random variables 4.3 Continuous random variables 4.4 Singular random variables 4.5 Transformations", " Chapter 4 Random variables This chapter deals with random variables and their distributions. The students are expected to acquire the following knowledge: Theoretical Identification of random variables. Convolutions of random variables. Derivation of PDF, PMF, CDF, and quantile function. Definitions and properties of common discrete random variables. Definitions and properties of common continuous random variables. Transforming univariate random variables. R Familiarize with PDF, PMF, CDF, and quantile functions for several distributions. Visual inspection of probability distributions. Analytical and empirical calculation of probabilities based on distributions. New R functions for plotting (for example, facet_wrap). Creating random number generators based on the Uniform distribution. .fold-btn { float: right; margin: 5px 5px 0 0; } .fold { border: 1px solid black; min-height: 40px; } 4.1 General properties and calculations Exercise 4.1 Which of the functions below are valid CDFs? Find their respective densities. R: Plot the three functions. \\[\\begin{equation} F(x) = \\begin{cases} 1 - e^{-x^2} & x \\geq 0 \\\\ 0 & x < 0. \\end{cases} \\end{equation}\\] \\[\\begin{equation} F(x) = \\begin{cases} e^{-\\frac{1}{x}} & x > 0 \\\\ 0 & x \\leq 0. \\end{cases} \\end{equation}\\] \\[\\begin{equation} F(x) = \\begin{cases} 0 & x \\leq 0 \\\\ \\frac{1}{3} & 0 < x \\leq \\frac{1}{2} \\\\ 1 & x > \\frac{1}{2}. \\end{cases} \\end{equation}\\] Solution. Yes. First, let us check the limits. \\(\\lim_{x \\rightarrow -\\infty} (0) = 0\\). \\(\\lim_{x \\rightarrow \\infty} (1 - e^{-x^2}) = 1 - \\lim_{x \\rightarrow \\infty} e^{-x^2} = 1 - 0 = 1\\). Second, let us check whether the function is increasing. Let \\(x > y \\geq 0\\). Then \\(1 - e^{-x^2} \\geq 1 - e^{-y^2}\\). We only have to check right continuity for the point zero. \\(F(0) = 0\\) and \\(\\lim_{\\epsilon \\downarrow 0}F (0 + \\epsilon) = \\lim_{\\epsilon \\downarrow 0} 1 - e^{-\\epsilon^2} = 1 - \\lim_{\\epsilon \\downarrow 0} e^{-\\epsilon^2} = 1 - 1 = 0\\). We get the density by differentiating the CDF. \\(p(x) = \\frac{d}{dx} 1 - e^{-x^2} = 2xe^{-x^2}.\\) Students are encouraged to check that this is a proper PDF. Yes. First, let us check the limits. $_{x -} (0) = 0 and \\(\\lim_{x \\rightarrow \\infty} (e^{-\\frac{1}{x}}) = 1\\). Second, let us check whether the function is increasing. Let \\(x > y \\geq 0\\). Then \\(e^{-\\frac{1}{x}} \\geq e^{-\\frac{1}{y}}\\). We only have to check right continuity for the point zero. \\(F(0) = 0\\) and \\(\\lim_{\\epsilon \\downarrow 0}F (0 + \\epsilon) = \\lim_{\\epsilon \\downarrow 0} e^{-\\frac{1}{\\epsilon}} = 0\\). We get the density by differentiating the CDF. 
\\(p(x) = \\frac{d}{dx} e^{-\\frac{1}{x}} = \\frac{1}{x^2}e^{-\\frac{1}{x}}.\\) Students are encouraged to check that this is a proper PDF. No. The function is not right continuous as \\(F(\\frac{1}{2}) = \\frac{1}{3}\\), but \\(\\lim_{\\epsilon \\downarrow 0} F(\\frac{1}{2} + \\epsilon) = 1\\). f1 <- function (x) { tmp <- 1 - exp(-x^2) tmp[x < 0] <- 0 return(tmp) } f2 <- function (x) { tmp <- exp(-(1 / x)) tmp[x <= 0] <- 0 return(tmp) } f3 <- function (x) { tmp <- x tmp[x == x] <- 1 tmp[x <= 0.5] <- 1/3 tmp[x <= 0] <- 0 return(tmp) } cdf_data <- tibble(x = seq(-1, 20, by = 0.001), f1 = f1(x), f2 = f2(x), f3 = f3(x)) %>% melt(id.vars = "x") cdf_plot <- ggplot(data = cdf_data, aes(x = x, y = value, color = variable)) + geom_hline(yintercept = 1) + geom_line() plot(cdf_plot) Exercise 4.2 Let \\(X\\) be a random variable with CDF \\[\\begin{equation} F(x) = \\begin{cases} 0 & x < 0 \\\\ \\frac{x^2}{2} & 0 \\leq x < 1 \\\\ \\frac{1}{2} + \\frac{p}{2} & 1 \\leq x < 2 \\\\ \\frac{1}{2} + \\frac{p}{2} + \\frac{1 - p}{2} & x \\geq 2 \\end{cases} \\end{equation}\\] R: Plot this CDF for \\(p = 0.3\\). Is it a discrete, continuous, or mixed random varible? Find the probability density/mass of \\(X\\). f1 <- function (x, p) { tmp <- x tmp[x >= 2] <- 0.5 + (p * 0.5) + ((1-p) * 0.5) tmp[x < 2] <- 0.5 + (p * 0.5) tmp[x < 1] <- (x[x < 1])^2 / 2 tmp[x < 0] <- 0 return(tmp) } cdf_data <- tibble(x = seq(-1, 5, by = 0.001), y = f1(x, 0.3)) cdf_plot <- ggplot(data = cdf_data, aes(x = x, y = y)) + geom_hline(yintercept = 1) + geom_line(color = "blue") plot(cdf_plot) ::: {.solution} \\(X\\) is a mixed random variable. Since \\(X\\) is a mixed random variable, we have to find the PDF of the continuous part and the PMF of the discrete part. We get the continuous part by differentiating the corresponding CDF, \\(\\frac{d}{dx}\\frac{x^2}{2} = x\\). So the PDF, when \\(0 \\leq x < 1\\), is \\(p(x) = x\\). Let us look at the discrete part now. It has two steps, so this is a discrete distribution with two outcomes – numbers 1 and 2. The first happens with probability \\(\\frac{p}{2}\\), and the second with probability \\(\\frac{1 - p}{2}\\). This reminds us of the Bernoulli distribution. The PMF for the discrete part is \\(P(X = x) = (\\frac{p}{2})^{2 - x} (\\frac{1 - p}{2})^{x - 1}\\). ::: Exercise 4.3 (Convolutions) Convolutions are probability distributions that correspond to sums of independent random variables. Let \\(X\\) and \\(Y\\) be independent discrete variables. Find the PMF of \\(Z = X + Y\\). Hint: Use the law of total probability. Let \\(X\\) and \\(Y\\) be independent continuous variables. Find the PDF of \\(Z = X + Y\\). Hint: Start with the CDF. Solution. \\[\\begin{align} P(Z = z) &= P(X + Y = z) & \\\\ &= \\sum_{k = -\\infty}^\\infty P(X + Y = z | Y = k) P(Y = k) & \\text{ (law of total probability)} \\\\ &= \\sum_{k = -\\infty}^\\infty P(X + k = z | Y = k) P(Y = k) & \\\\ &= \\sum_{k = -\\infty}^\\infty P(X + k = z) P(Y = k) & \\text{ (independence of $X$ and $Y$)} \\\\ &= \\sum_{k = -\\infty}^\\infty P(X = z - k) P(Y = k). & \\end{align}\\] Let \\(f\\) and \\(g\\) be the PDFs of \\(X\\) and \\(Y\\) respectively. 
\\[\\begin{align} F(z) &= P(Z < z) \\\\ &= P(X + Y < z) \\\\ &= \\int_{-\\infty}^{\\infty} P(X + Y < z | Y = y)P(Y = y)dy \\\\ &= \\int_{-\\infty}^{\\infty} P(X + y < z | Y = y)P(Y = y)dy \\\\ &= \\int_{-\\infty}^{\\infty} P(X + y < z)P(Y = y)dy \\\\ &= \\int_{-\\infty}^{\\infty} P(X < z - y)P(Y = y)dy \\\\ &= \\int_{-\\infty}^{\\infty} (\\int_{-\\infty}^{z - y} f(x) dx) g(y) dy \\end{align}\\] Now \\[\\begin{align} p(z) &= \\frac{d}{dz} F(z) & \\\\ &= \\int_{-\\infty}^{\\infty} (\\frac{d}{dz}\\int_{-\\infty}^{z - y} f(x) dx) g(y) dy & \\\\ &= \\int_{-\\infty}^{\\infty} f(z - y) g(y) dy & \\text{ (fundamental theorem of calculus)}. \\end{align}\\] 4.2 Discrete random variables Exercise 4.4 (Binomial random variable) Let \\(X_k\\), \\(k = 1,...,n\\), be random variables with the Bernoulli measure as the PMF. Let \\(X = \\sum_{k=1}^n X_k\\). We call \\(X_k\\) a Bernoulli random variable with parameter \\(p \\in (0,1)\\). Find the CDF of \\(X_k\\). Find PMF of \\(X\\). This is a Binomial random variable with support in \\(\\{0,1,2,...,n\\}\\) and parameters \\(p \\in (0,1)\\) and \\(n \\in \\mathbb{N}_0\\). We denote \\[\\begin{equation} X | n,p \\sim \\text{binomial}(n,p). \\end{equation}\\] Find CDF of \\(X\\). R: Simulate from the binomial distribution with \\(n = 10\\) and \\(p = 0.5\\), and from \\(n\\) Bernoulli distributions with \\(p = 0.5\\). Visually compare the sum of Bernoullis and the binomial. Hint: there is no standard function like rpois for a Bernoulli random variable. Check exercise ?? to find out how to sample from a Bernoulli distribution. Solution. There are two outcomes – zero and one. Zero happens with probability \\(1 - p\\). Therefore \\[\\begin{equation} F(k) = \\begin{cases} 0 & k < 0 \\\\ 1 - p & 0 \\leq k < 1 \\\\ 1 & k \\geq 1. \\end{cases} \\end{equation}\\] For the probability of \\(X\\) to be equal to some \\(k \\leq n\\), exactly \\(k\\) Bernoulli variables need to be one, and the others zero. So \\(p^k(1-p)^{n-k}\\). There are \\(\\binom{n}{k}\\) such possible arrangements. Therefore \\[\\begin{align} P(X = k) = \\binom{n}{k} p^k (1 - p)^{n-k}. \\end{align}\\] \\[\\begin{equation} F(k) = \\sum_{i = 0}^{\\lfloor k \\rfloor} \\binom{n}{i} p^i (1 - p)^{n - i} \\end{equation}\\] set.seed(1) nsamps <- 10000 binom_samp <- rbinom(nsamps, size = 10, prob = 0.5) bernoulli_mat <- matrix(data = NA, nrow = nsamps, ncol = 10) for (i in 1:nsamps) { bernoulli_mat[i, ] <- rbinom(10, size = 1, prob = 0.5) } bern_samp <- apply(bernoulli_mat, 1, sum) b_data <- tibble(x = c(binom_samp, bern_samp), type = c(rep("binomial", 10000), rep("Bernoulli_sum", 10000))) b_plot <- ggplot(data = b_data, aes(x = x, fill = type)) + geom_bar(position = "dodge") plot(b_plot) Exercise 4.5 (Geometric random variable) A variable with PMF \\[\\begin{equation} P(k) = p(1-p)^k \\end{equation}\\] is a geometric random variable with support in non-negative integers. It has one parameter \\(p \\in (0,1]\\). We denote \\[\\begin{equation} X | p \\sim \\text{geometric}(p) \\end{equation}\\] Derive the CDF of a geometric random variable. R: Draw 1000 samples from the geometric distribution with \\(p = 0.3\\) and compare their frequencies to theoretical values. Solution. 
\\[\\begin{align} P(X \\leq k) &= \\sum_{i = 0}^k p(1-p)^i \\\\ &= p \\sum_{i = 0}^k (1-p)^i \\\\ &= p \\frac{1 - (1-p)^{k+1}}{1 - (1 - p)} \\\\ &= 1 - (1-p)^{k + 1} \\end{align}\\] set.seed(1) geo_samp <- rgeom(n = 1000, prob = 0.3) geo_samp <- data.frame(x = geo_samp) %>% count(x) %>% mutate(n = n / 1000, type = "empirical_frequencies") %>% bind_rows(data.frame(x = 0:20, n = dgeom(0:20, prob = 0.3), type = "theoretical_measure")) geo_plot <- ggplot(data = geo_samp, aes(x = x, y = n, fill = type)) + geom_bar(stat="identity", position = "dodge") plot(geo_plot) Exercise 4.6 (Poisson random variable) A variable with PMF \\[\\begin{equation} P(k) = \\frac{\\lambda^k e^{-\\lambda}}{k!} \\end{equation}\\] is a Poisson random variable with support in non-negative integers. It has one positive parameter \\(\\lambda\\), which also represents its mean value and variance (a measure of the deviation of the values from the mean – more on mean and variance in the next chapter). We denote \\[\\begin{equation} X | \\lambda \\sim \\text{Poisson}(\\lambda). \\end{equation}\\] This distribution is usually the default choice for modeling counts. We have already encountered a Poisson random variable in exercise ??, where we also sampled from this distribution. The CDF of a Poisson random variable is \\(P(X <= x) = e^{-\\lambda} \\sum_{i=0}^x \\frac{\\lambda^{i}}{i!}\\). R: Draw 1000 samples from the Poisson distribution with \\(\\lambda = 5\\) and compare their empirical cumulative distribution function with the theoretical CDF. set.seed(1) pois_samp <- rpois(n = 1000, lambda = 5) pois_samp <- data.frame(x = pois_samp) pois_plot <- ggplot(data = pois_samp, aes(x = x, colour = "ECDF")) + stat_ecdf(geom = "step") + geom_step(data = tibble(x = 0:17, y = ppois(x, 5)), aes(x = x, y = y, colour = "CDF")) + scale_colour_manual("Lgend title", values = c("black", "red")) plot(pois_plot) Exercise 4.7 (Negative binomial random variable) A variable with PMF \\[\\begin{equation} p(k) = \\binom{k + r - 1}{k}(1-p)^r p^k \\end{equation}\\] is a negative binomial random variable with support in non-negative integers. It has two parameters \\(r > 0\\) and \\(p \\in (0,1)\\). We denote \\[\\begin{equation} X | r,p \\sim \\text{NB}(r,p). \\end{equation}\\] Let us reparameterize the negative binomial distribution with \\(q = 1 - p\\). Find the PMF of \\(X \\sim \\text{NB}(1, q)\\). Do you recognize this distribution? Show that the sum of two negative binomial random variables with the same \\(p\\) is also a negative binomial random variable. Hint: Use the fact that the number of ways to place \\(n\\) indistinct balls into \\(k\\) boxes is \\(\\binom{n + k - 1}{n}\\). R: Draw samples from \\(X \\sim \\text{NB}(5, 0.4)\\) and \\(Y \\sim \\text{NB}(3, 0.4)\\). Draw samples from \\(Z = X + Y\\), where you use the parameters calculated in b). Plot both distributions, their sum, and \\(Z\\) using facet_wrap. Be careful, as R uses a different parameterization size=\\(r\\) and prob=\\(1 - p\\). Solution. \\[\\begin{align} P(X = k) &= \\binom{k + 1 - 1}{k}q^1 (1-q)^k \\\\ &= q(1-q)^k. \\end{align}\\] This is the geometric distribution. Let \\(X \\sim \\text{NB}(r_1, p)\\) and \\(Y \\sim \\text{NB}(r_2, p)\\). Let \\(Z = X + Y\\). 
\\[\\begin{align} P(Z = z) &= \\sum_{k = 0}^{\\infty} P(X = z - k)P(Y = k), \\text{ if k < 0, then the probabilities are 0} \\\\ &= \\sum_{k = 0}^{z} P(X = z - k)P(Y = k), \\text{ if k > z, then the probabilities are 0} \\\\ &= \\sum_{k = 0}^{z} \\binom{z - k + r_1 - 1}{z - k}(1 - p)^{r_1} p^{z - k} \\binom{k + r_2 - 1}{k}(1 - p)^{r_2} p^{k} & \\\\ &= \\sum_{k = 0}^{z} \\binom{z - k + r_1 - 1}{z - k} \\binom{k + r_2 - 1}{k}(1 - p)^{r_1 + r_2} p^{z} & \\\\ &= (1 - p)^{r_1 + r_2} p^{z} \\sum_{k = 0}^{z} \\binom{z - k + r_1 - 1}{z - k} \\binom{k + r_2 - 1}{k}& \\end{align}\\] The part before the sum reminds us of the negative binomial distribution with parameters \\(r_1 + r_2\\) and \\(p\\). To complete this term to the negative binomial PMF we need \\(\\binom{z + r_1 + r_2 -1}{z}\\). So the only thing we need to prove is that the sum equals this term. Both terms in the sum can be interpreted as numbers of ways to place a number of balls into boxes. For the left term it is \\(z-k\\) balls into \\(r_1\\) boxes, and for the right \\(k\\) balls into \\(r_2\\) boxes. For each \\(k\\) we are distributing \\(z\\) balls in total. By summing over all \\(k\\), we actually get all the possible placements of \\(z\\) balls into \\(r_1 + r_2\\) boxes. Therefore \\[\\begin{align} P(Z = z) &= (1 - p)^{r_1 + r_2} p^{z} \\sum_{k = 0}^{z} \\binom{z - k + r_1 - 1}{z - k} \\binom{k + r_2 - 1}{k}& \\\\ &= \\binom{z + r_1 + r_2 -1}{z} (1 - p)^{r_1 + r_2} p^{z}. \\end{align}\\] From this it also follows that the sum of geometric distributions with the same parameter is a negative binomial distribution. \\(Z \\sim \\text{NB}(8, 0.4)\\). set.seed(1) nsamps <- 10000 x <- rnbinom(nsamps, size = 5, prob = 0.6) y <- rnbinom(nsamps, size = 3, prob = 0.6) xpy <- x + y z <- rnbinom(nsamps, size = 8, prob = 0.6) samps <- tibble(x, y, xpy, z) samps <- melt(samps) ggplot(data = samps, aes(x = value)) + geom_bar() + facet_wrap(~ variable) 4.3 Continuous random variables Exercise 4.8 (Exponential random variable) A variable \\(X\\) with PDF \\(\\lambda e^{-\\lambda x}\\) is an exponential random variable with support in non-negative real numbers. It has one positive parameter \\(\\lambda\\). We denote \\[\\begin{equation} X | \\lambda \\sim \\text{Exp}(\\lambda). \\end{equation}\\] Find the CDF of an exponential random variable. Find the quantile function of an exponential random variable. Calculate the probability \\(P(1 \\leq X \\leq 3)\\), where \\(X \\sim \\text{Exp(1.5)}\\). R: Check your answer to c) with a simulation (rexp). Plot the probability in a meaningful way. R: Implement PDF, CDF, and the quantile function and compare their values with corresponding R functions visually. Hint: use the size parameter to make one of the curves wider. Solution. \\[\\begin{align} F(x) &= \\int_{0}^{x} \\lambda e^{-\\lambda t} dt \\\\ &= \\lambda \\int_{0}^{x} e^{-\\lambda t} dt \\\\ &= \\lambda (\\frac{1}{-\\lambda}e^{-\\lambda t} |_{0}^{x}) \\\\ &= \\lambda(\\frac{1}{\\lambda} - \\frac{1}{\\lambda} e^{-\\lambda x}) \\\\ &= 1 - e^{-\\lambda x}. \\end{align}\\] \\[\\begin{align} F(F^{-1}(x)) &= x \\\\ 1 - e^{-\\lambda F^{-1}(x)} &= x \\\\ e^{-\\lambda F^{-1}(x)} &= 1 - x \\\\ -\\lambda F^{-1}(x) &= \\ln(1 - x) \\\\ F^{-1}(x) &= - \\frac{ln(1 - x)}{\\lambda}. \\end{align}\\] \\[\\begin{align} P(1 \\leq X \\leq 3) &= P(X \\leq 3) - P(X \\leq 1) \\\\ &= P(X \\leq 3) - P(X \\leq 1) \\\\ &= 1 - e^{-1.5 \\times 3} - 1 + e^{-1.5 \\times 1} \\\\ &\\approx 0.212. 
\\end{align}\\] set.seed(1) nsamps <- 1000 samps <- rexp(nsamps, rate = 1.5) sum(samps >= 1 & samps <= 3) / nsamps ## [1] 0.212 exp_plot <- ggplot(data.frame(x = seq(0, 5, by = 0.01)), aes(x = x)) + stat_function(fun = dexp, args = list(rate = 1.5)) + stat_function(fun = dexp, args = list(rate = 1.5), xlim = c(1,3), geom = "area", fill = "red") plot(exp_plot) exp_pdf <- function(x, lambda) { return (lambda * exp(-lambda * x)) } exp_cdf <- function(x, lambda) { return (1 - exp(-lambda * x)) } exp_quant <- function(q, lambda) { return (-(log(1 - q) / lambda)) } ggplot(data = data.frame(x = seq(0, 5, by = 0.01)), aes(x = x)) + stat_function(fun = dexp, args = list(rate = 1.5), aes(color = "R"), size = 2.5) + stat_function(fun = exp_pdf, args = list(lambda = 1.5), aes(color = "Mine"), size = 1.2) + scale_color_manual(values = c("red", "black")) ggplot(data = data.frame(x = seq(0, 5, by = 0.01)), aes(x = x)) + stat_function(fun = pexp, args = list(rate = 1.5), aes(color = "R"), size = 2.5) + stat_function(fun = exp_cdf, args = list(lambda = 1.5), aes(color = "Mine"), size = 1.2) + scale_color_manual(values = c("red", "black")) ggplot(data = data.frame(x = seq(0, 1, by = 0.01)), aes(x = x)) + stat_function(fun = qexp, args = list(rate = 1.5), aes(color = "R"), size = 2.5) + stat_function(fun = exp_quant, args = list(lambda = 1.5), aes(color = "Mine"), size = 1.2) + scale_color_manual(values = c("red", "black")) Exercise 4.9 (Uniform random variable) Continuous uniform random variable with parameters \\(a\\) and \\(b\\) has the PDF \\[\\begin{equation} p(x) = \\begin{cases} \\frac{1}{b - a} & x \\in [a,b] \\\\ 0 & \\text{otherwise}. \\end{cases} \\end{equation}\\] Find the CDF of the uniform random variable. Find the quantile function of the uniform random variable. Let \\(X \\sim \\text{Uniform}(a,b)\\). Find the CDF of the variable \\(Y = \\frac{X - a}{b - a}\\). This is the standard uniform random variable. Let \\(X \\sim \\text{Uniform}(-1, 3)\\). Find such \\(z\\) that \\(P(X < z + \\mu_x) = \\frac{1}{5}\\). R: Check your result from d) using simulation. Solution. \\[\\begin{align} F(x) &= \\int_{a}^x \\frac{1}{b - a} dt \\\\ &= \\frac{1}{b - a} \\int_{a}^x dt \\\\ &= \\frac{x - a}{b - a}. \\end{align}\\] \\[\\begin{align} F(F^{-1}(p)) &= p \\\\ \\frac{F^{-1}(p) - a}{b - a} &= p \\\\ F^{-1}(p) &= p(b - a) + a. \\end{align}\\] \\[\\begin{align} F_Y(y) &= P(Y < y) \\\\ &= P(\\frac{X - a}{b - a} < y) \\\\ &= P(X < y(b - a) + a) \\\\ &= F_X(y(b - a) + a) \\\\ &= \\frac{(y(b - a) + a) - a}{b - a} \\\\ &= y. \\end{align}\\] \\[\\begin{align} P(X < z + 1) &= \\frac{1}{5} \\\\ F(z + 1) &= \\frac{1}{5} \\\\ z + 1 &= F^{-1}(\\frac{1}{5}) \\\\ z &= \\frac{1}{5}4 - 1 - 1 \\\\ z &= -1.2. \\end{align}\\] set.seed(1) a <- -1 b <- 3 nsamps <- 10000 unif_samp <- runif(nsamps, a, b) mu_x <- mean(unif_samp) new_samp <- unif_samp - mu_x quantile(new_samp, probs = 1/5) ## 20% ## -1.203192 punif(-0.2, -1, 3) ## [1] 0.2 Exercise 4.10 (Beta random variable) A variable \\(X\\) with PDF \\[\\begin{equation} p(x) = \\frac{x^{\\alpha - 1} (1 - x)^{\\beta - 1}}{\\text{B}(\\alpha, \\beta)}, \\end{equation}\\] where \\(\\text{B}(\\alpha, \\beta) = \\frac{\\Gamma(\\alpha) \\Gamma(\\beta)}{\\Gamma(\\alpha + \\beta)}\\) and \\(\\Gamma(x) = \\int_0^{\\infty} x^{z - 1} e^{-x} dx\\) is a Beta random variable with support on \\([0,1]\\). It has two positive parameters \\(\\alpha\\) and \\(\\beta\\). 
Notation: \\[\\begin{equation} X | \\alpha, \\beta \\sim \\text{Beta}(\\alpha, \\beta) \\end{equation}\\] It is often used in modeling rates. Calculate the PDF for \\(\\alpha = 1\\) and \\(\\beta = 1\\). What do you notice? R: Plot densities of the beta distribution for parameter pairs (2, 2), (4, 1), (1, 4), (2, 5), and (0.1, 0.1). R: Sample from \\(X \\sim \\text{Beta}(2, 5)\\) and compare the histogram with the Beta PDF. Solution. \\[\\begin{equation} p(x) = \\frac{x^{1 - 1} (1 - x)^{1 - 1}}{\\text{B}(1, 1)} = 1. \\end{equation}\\] This is the standard uniform distribution. set.seed(1) ggplot(data = data.frame(x = seq(0, 1, by = 0.01)), aes(x = x)) + stat_function(fun = dbeta, args = list(shape1 = 2, shape2 = 2), aes(color = "Beta(2,2)")) + stat_function(fun = dbeta, args = list(shape1 = 4, shape2 = 1), aes(color = "Beta(4,1)")) + stat_function(fun = dbeta, args = list(shape1 = 1, shape2 = 4), aes(color = "Beta(1,4)")) + stat_function(fun = dbeta, args = list(shape1 = 2, shape2 = 5), aes(color = "Beta(2,5)")) + stat_function(fun = dbeta, args = list(shape1 = 0.1, shape2 = 0.1), aes(color = "Beta(0.1,0.1)")) set.seed(1) nsamps <- 1000 samps <- rbeta(nsamps, 2, 5) ggplot(data = data.frame(x = samps), aes(x = x)) + geom_histogram(aes(y = ..density..), color = "black") + stat_function(data = data.frame(x = seq(0, 1, by = 0.01)), aes(x = x), fun = dbeta, args = list(shape1 = 2, shape2 = 5), color = "red", size = 1.2) Exercise 4.11 (Gamma random variable) A random variable with PDF \\[\\begin{equation} p(x) = \\frac{\\beta^\\alpha}{\\Gamma(\\alpha)} x^{\\alpha - 1}e^{-\\beta x} \\end{equation}\\] is a Gamma random variable with support on the positive numbers and parameters shape \\(\\alpha > 0\\) and rate \\(\\beta > 0\\). We write \\[\\begin{equation} X | \\alpha, \\beta \\sim \\text{Gamma}(\\alpha, \\beta) \\end{equation}\\] and its CDF is \\[\\begin{equation} \\frac{\\gamma(\\alpha, \\beta x)}{\\Gamma(\\alpha)}, \\end{equation}\\] where \\(\\gamma(s, x) = \\int_0^x t^{s-1} e^{-t} dt\\) is the lower incomplete gamma function. It is usually used in modeling positive phenomena (for example, insurance claims and rainfall). Let \\(X \\sim \\text{Gamma}(1, \\beta)\\). Find the PDF of \\(X\\). Do you recognize this PDF? Let \\(k = \\alpha\\) and \\(\\theta = \\frac{1}{\\beta}\\). Find the PDF of \\(X | k, \\theta \\sim \\text{Gamma}(k, \\theta)\\). Random variables can be reparameterized, and sometimes a reparameterized distribution is more convenient for certain calculations. The shape-rate parameterization, for example, is usually used in Bayesian statistics, while the shape-scale parameterization is more common in econometrics and some other applied fields. Note that you also need to pay attention to the parameters in statistical software, so diligently read the help files when using functions like rgamma to see how the function is parameterized. R: Plot the gamma CDF for random variables with shape and rate parameters (1,1), (10,1), (1,10). Solution. \\[\\begin{align} p(x) &= \\frac{\\beta^1}{\\Gamma(1)} x^{1 - 1}e^{-\\beta x} \\\\ &= \\beta e^{-\\beta x} \\end{align}\\] This is the PDF of the exponential distribution with parameter \\(\\beta\\). \\[\\begin{align} p(x) &= \\frac{1}{\\Gamma(k)\\theta^k} x^{k - 1}e^{-\\frac{x}{\\theta}}.
\\end{align}\\] set.seed(1) ggplot(data = data.frame(x = seq(0, 25, by = 0.01)), aes(x = x)) + stat_function(fun = pgamma, args = list(shape = 1, rate = 1), aes(color = "Gamma(1,1)")) + stat_function(fun = pgamma, args = list(shape = 10, rate = 1), aes(color = "Gamma(10,1)")) + stat_function(fun = pgamma, args = list(shape = 1, rate = 10), aes(color = "Gamma(1,10)")) Exercise 4.12 (Normal random variable) A random variable with PDF \\[\\begin{equation} p(x) = \\frac{1}{\\sqrt{2 \\pi \\sigma^2}} e^{-\\frac{(x - \\mu)^2}{2 \\sigma^2}} \\end{equation}\\] is a normal random variable with support on the real axis and parameters \\(\\mu \\in \\mathbb{R}\\) and \\(\\sigma^2 > 0\\). The first is the mean parameter and the second is the variance parameter. Many statistical methods assume a normal distribution. We denote \\[\\begin{equation} X | \\mu, \\sigma \\sim \\text{N}(\\mu, \\sigma^2), \\end{equation}\\] and its CDF is \\[\\begin{equation} F(x) = \\int_{-\\infty}^x \\frac{1}{\\sqrt{2 \\pi \\sigma^2}} e^{-\\frac{(t - \\mu)^2}{2 \\sigma^2}} dt, \\end{equation}\\] which has no closed-form expression and is usually evaluated numerically. It is also one of the most thoroughly studied distributions; for that reason statisticians often transform variables so that they are approximately normal, or approximate other distributions with the normal distribution. Show that the variable \\(\\frac{X - \\mu}{\\sigma} \\sim \\text{N}(0,1)\\). This transformation is called standardization, and \\(\\text{N}(0,1)\\) is the standard normal distribution. R: Plot the normal distribution with \\(\\mu = 0\\) and different values of the \\(\\sigma\\) parameter. R: The normal distribution provides a good approximation for the Poisson distribution with a large \\(\\lambda\\). Let \\(X \\sim \\text{Poisson}(50)\\). Approximate \\(X\\) with the normal distribution and compare its density with the Poisson histogram. What are the values of \\(\\mu\\) and \\(\\sigma^2\\) that should provide the best approximation? Note that the R function rnorm takes the standard deviation (\\(\\sigma\\)) as a parameter, not the variance. Solution. \\[\\begin{align} P(\\frac{X - \\mu}{\\sigma} < x) &= P(X < \\sigma x + \\mu) \\\\ &= F(\\sigma x + \\mu) \\\\ &= \\int_{-\\infty}^{\\sigma x + \\mu} \\frac{1}{\\sqrt{2 \\pi \\sigma^2}} e^{-\\frac{(t - \\mu)^2}{2\\sigma^2}} dt \\end{align}\\] Now let \\(s = f(t) = \\frac{t - \\mu}{\\sigma}\\), then \\(ds = \\frac{dt}{\\sigma}\\) and \\(f(\\sigma x + \\mu) = x\\), so \\[\\begin{align} P(\\frac{X - \\mu}{\\sigma} < x) &= \\int_{-\\infty}^{x} \\frac{1}{\\sqrt{2 \\pi}} e^{-\\frac{s^2}{2}} ds. \\end{align}\\] There is no need to evaluate this integral, as we recognize it as the CDF of a normal distribution with \\(\\mu = 0\\) and \\(\\sigma^2 = 1\\).
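As a quick numerical sanity check of the standardization result, one can standardize draws from an arbitrary normal distribution and compare them with the standard normal. This is an illustrative sketch with arbitrarily chosen parameters (mean 3, standard deviation 2); it is not part of the original exercise.
# Sanity check (illustrative): standardized samples from N(3, 2^2) should behave like N(0, 1)
set.seed(1)
x <- rnorm(100000, mean = 3, sd = 2)
z <- (x - 3) / 2          # standardization
mean(z)                   # should be close to 0
var(z)                    # should be close to 1
ks.test(z, "pnorm")       # compares the empirical CDF of z with the standard normal CDF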
set.seed(1) # b ggplot(data = data.frame(x = seq(-15, 15, by = 0.01)), aes(x = x)) + stat_function(fun = dnorm, args = list(mean = 0, sd = 1), aes(color = "sd = 1")) + stat_function(fun = dnorm, args = list(mean = 0, sd = 0.4), aes(color = "sd = 0.4")) + stat_function(fun = dnorm, args = list(mean = 0, sd = 2), aes(color = "sd = 2")) + stat_function(fun = dnorm, args = list(mean = 0, sd = 5), aes(color = "sd = 5")) # c mean_par <- 50 nsamps <- 100000 pois_samps <- rpois(nsamps, lambda = mean_par) norm_samps <- rnorm(nsamps, mean = mean_par, sd = sqrt(mean_par)) my_plot <- ggplot() + geom_bar(data = tibble(x = pois_samps), aes(x = x, y = (..count..)/sum(..count..))) + geom_density(data = tibble(x = norm_samps), aes(x = x), color = "red") plot(my_plot) Exercise 4.13 (Logistic random variable) A logistic random variable has CDF \\[\\begin{equation} F(x) = \\frac{1}{1 + e^{-\\frac{x - \\mu}{s}}}, \\end{equation}\\] where \\(\\mu\\) is real and \\(s > 0\\). The support is on the real axis. We denote \\[\\begin{equation} X | \\mu, s \\sim \\text{Logistic}(\\mu, s). \\end{equation}\\] The distribution of the logistic random variable resembles that of a normal random variable, but it has heavier tails. Find the PDF of a logistic random variable. R: Implement the logistic PDF and CDF and visually compare both for \\(X \\sim \\text{N}(0, 1)\\) and \\(Y \\sim \\text{Logistic}(0, \\sqrt{\\frac{3}{\\pi^2}})\\). These distributions have the same mean and variance. Additionally, produce the same plot on the interval [5,10] to better see the difference in the tails. R: For the distributions in b) find the probability \\(P(|X| > 4)\\) and interpret the result. Solution. \\[\\begin{align} p(x) &= \\frac{d}{dx} \\frac{1}{1 + e^{-\\frac{x - \\mu}{s}}} \\\\ &= \\frac{- \\frac{d}{dx} (1 + e^{-\\frac{x - \\mu}{s}})}{(1 + e^{-\\frac{x - \\mu}{s}})^2} \\\\ &= \\frac{e^{-\\frac{x - \\mu}{s}}}{s(1 + e^{-\\frac{x - \\mu}{s}})^2}. \\end{align}\\] # b # Note: the code below uses sd = 2 for the normal and s = sqrt(12/pi^2) for the logistic # (both with variance 4), a scaled version of the variance-1 pair in the exercise statement. set.seed(1) logit_pdf <- function (x, mu, s) { return ((exp(-(x - mu)/(s))) / (s * (1 + exp(-(x - mu)/(s)))^2)) } nl_plot <- ggplot(data = data.frame(x = seq(-12, 12, by = 0.01)), aes(x = x)) + stat_function(fun = dnorm, args = list(mean = 0, sd = 2), aes(color = "normal")) + stat_function(fun = logit_pdf, args = list(mu = 0, s = sqrt(12/pi^2)), aes(color = "logit")) plot(nl_plot) nl_plot <- ggplot(data = data.frame(x = seq(5, 10, by = 0.01)), aes(x = x)) + stat_function(fun = dnorm, args = list(mean = 0, sd = 2), aes(color = "normal")) + stat_function(fun = logit_pdf, args = list(mu = 0, s = sqrt(12/pi^2)), aes(color = "logit")) plot(nl_plot) # c logit_cdf <- function (x, mu, s) { return (1 / (1 + exp(-(x - mu) / s))) } p_logistic <- 1 - logit_cdf(4, 0, sqrt(12/pi^2)) + logit_cdf(-4, 0, sqrt(12/pi^2)) p_norm <- 1 - pnorm(4, 0, 2) + pnorm(-4, 0, 2) p_logistic ## [1] 0.05178347 p_norm ## [1] 0.04550026 # The logistic distribution has heavier tails, therefore the probability of large # absolute values is higher. 4.4 Singular random variables Exercise 4.14 (Cantor distribution) The Cantor set is a subset of \\([0,1]\\), which we create by iteratively deleting the middle third of each remaining interval. For example, in the first iteration, we get the sets \\([0,\\frac{1}{3}]\\) and \\([\\frac{2}{3},1]\\). In the second iteration, we get \\([0,\\frac{1}{9}]\\), \\([\\frac{2}{9},\\frac{1}{3}]\\), \\([\\frac{2}{3}, \\frac{7}{9}]\\), and \\([\\frac{8}{9}, 1]\\).
On the \\(n\\)-th iteration, we have \\[\\begin{equation} C_n = \\frac{C_{n-1}}{3} \\cup \\bigg(\\frac{2}{3} + \\frac{C_{n-1}}{3} \\bigg), \\end{equation}\\] where \\(C_0 = [0,1]\\). The Cantor set is then defined as the intersection of these sets \\[\\begin{equation} C = \\cap_{n=1}^{\\infty} C_n. \\end{equation}\\] It has the same cardinality as \\([0,1]\\). Another way to define the Cantor set is as the set of all numbers in \\([0,1]\\) that do not have a 1 in their ternary representation \\(x = \\sum_{i=1}^\\infty \\frac{x_i}{3^i}\\), \\(x_i \\in \\{0,1,2\\}\\). A random variable follows the Cantor distribution if its CDF is the Cantor function. You can find implementations of the random number generator, CDF, and quantile function for the Cantor distribution at https://github.com/Henrygb/CantorDist.R. Show that the Lebesgue measure of the Cantor set is 0. (Jagannathan) Let us look at an infinite sequence of independent fair-coin tosses. If the \\(i\\)-th outcome is heads, let \\(x_i = 2\\); if it is tails, let \\(x_i = 0\\). Then use these to create \\(x = \\sum_{i=1}^\\infty \\frac{x_i}{3^i}\\). This is a random variable with the Cantor distribution. Show that \\(X\\) has a singular distribution. Solution. \\[\\begin{align} \\lambda(C) &= 1 - \\lambda(C^c) \\\\ &= 1 - \\frac{1}{3}\\sum_{k = 0}^\\infty (\\frac{2}{3})^k \\\\ &= 1 - \\frac{\\frac{1}{3}}{1 - \\frac{2}{3}} \\\\ &= 0. \\end{align}\\] First, for every \\(x\\), the probability of observing it is \\(\\lim_{n \\rightarrow \\infty} \\frac{1}{2^n} = 0\\), so the distribution has no point masses and therefore no discrete component. Second, every realization lies in the Cantor set, so \\(P(X \\in C) = 1\\) even though \\(\\lambda(C) = 0\\), which means the distribution cannot have a density (no absolutely continuous component). Therefore \\(X\\) has a singular distribution. Its CDF increases only on the elements of the Cantor set. 4.5 Transformations Exercise 4.15 Let \\(X\\) be a random variable that is uniformly distributed on \\(\\{-2, -1, 0, 1, 2\\}\\). Find the PMF of \\(Y = X^2\\). Solution. \\[\\begin{align} P_Y(y) = \\sum_{x \\in \\{-\\sqrt{y}, \\sqrt{y}\\}} P_X(x) = \\begin{cases} 0 & y \\notin \\{0,1,4\\} \\\\ \\frac{1}{5} & y = 0 \\\\ \\frac{2}{5} & y \\in \\{1,4\\} \\end{cases} \\end{align}\\] Exercise 4.16 (Continuous uniform random variable) Let \\(X \\sim U(-1, 1)\\) be uniformly distributed on \\([-1, 1]\\) and let \\(Y = X^2\\). Find the CDF of \\(Y\\). Find the PDF of \\(Y\\) and verify that it integrates to 1. R: Plot histograms of samples from \\(X\\) and \\(Y\\) and overlay the true densities. Solution. We first observe that \\(Y \\in [0, 1]\\). If a sample from \\(Y\\) is less than \\(\\alpha\\), the corresponding sample from \\(X\\) must be in \\(\\left[-\\sqrt{\\alpha}, \\sqrt{\\alpha}\\right]\\). \\[\\begin{align} F_Y(\\alpha) = P_X(X \\in \\left[-\\sqrt{\\alpha}, \\sqrt{\\alpha}\\right]) &= F_X(\\sqrt{\\alpha}) - F_X(-\\sqrt{\\alpha}) \\\\ &= \\frac{\\sqrt{\\alpha} + 1}{2} - \\frac{-\\sqrt{\\alpha} + 1}{2} = \\sqrt{\\alpha}. \\end{align}\\] \\[\\begin{align} f_Y(\\alpha) = \\frac{\\partial}{\\partial \\alpha} F_Y(\\alpha) = \\frac{\\partial}{\\partial \\alpha} \\sqrt{\\alpha} = \\frac{1}{2\\sqrt{\\alpha}}. \\end{align}\\] \\[\\begin{align} \\int_{0}^1 f_Y(\\alpha)d\\alpha = 0.5\\int_{0}^1 \\frac{1}{\\sqrt{\\alpha}}d\\alpha = 0.5\\left[\\frac{\\alpha^{0.5}}{0.5}\\right]_0^1 = 1 - 0 = 1.
\\end{align}\\] # Draw samples to plot set.seed(0) n <- 10000 x <- runif(n, min=-1, max=1) y <- runif(n, min=-1, max=1)^2 # Dataframe of samples df <- data.frame(value=c(x, y), RV=c( rep("X", n), rep("Y", n) )) # Dataframe with analytically computed density of Y df_y_analytic <- data.frame(y=seq(1e-2, 1, length.out=1000)) df_y_analytic$density <- 1 / (2 * sqrt(df_y_analytic$y)) library(ggplot2) ggplot(df) + geom_histogram(aes(x=value, after_stat(density), fill=RV), alpha=0.5, bins=50, position = "identity") + stat_function(fun = function(u) 1/2, color="red") + geom_path(data=df_y_analytic, aes(x=y, y=density), color="blue") Exercise 4.17 (Lognormal random variable) A lognormal random variable is a variable whose logarithm is normally distributed. In practice, we often encounter skewed data. Applying a log transformation to such data usually makes it more symmetric and therefore more suitable for modeling with the normal distribution (more on why we wish to model data with the normal distribution in the following chapters). Let \\(X \\sim \\text{N}(\\mu, \\sigma^2)\\). Find the PDF of \\(Y: \\log(Y) = X\\). R: Sample from the lognormal distribution with parameters \\(\\mu = 5\\) and \\(\\sigma = 2\\). Plot a histogram of the samples. Then log-transform the samples and plot a histogram along with the theoretical normal PDF. Solution. \\[\\begin{align} p_Y(y) &= p_X(\\log(y)) \\frac{d}{dy} \\log(y) \\\\ &= \\frac{1}{\\sqrt{2 \\pi \\sigma^2}} e^{-\\frac{(\\log(y) - \\mu)^2}{2 \\sigma^2}} \\frac{1}{y} \\\\ &= \\frac{1}{y \\sqrt{2 \\pi \\sigma^2}} e^{-\\frac{(\\log(y) - \\mu)^2}{2 \\sigma^2}}. \\end{align}\\] set.seed(1) nsamps <- 10000 # Note: smaller parameter values than in the exercise statement are used here. mu <- 0.5 sigma <- 0.4 ln_samps <- rlnorm(nsamps, mu, sigma) ln_plot <- ggplot(data = data.frame(x = ln_samps), aes(x = x)) + geom_histogram(color = "black") plot(ln_plot) norm_samps <- log(ln_samps) n_plot <- ggplot(data = data.frame(x = norm_samps), aes(x = x)) + geom_histogram(aes(y = ..density..), color = "black") + stat_function(fun = dnorm, args = list(mean = mu, sd = sigma), color = "red") plot(n_plot) Exercise 4.18 (Probability integral transform) This exercise is borrowed from Wasserman. Let \\(X\\) have a continuous, strictly increasing CDF \\(F\\). Let \\(Y = F(X)\\). Find the density of \\(Y\\). This is called the probability integral transform. Let \\(U \\sim \\text{Uniform}(0,1)\\) and let \\(X = F^{-1}(U)\\). Show that \\(X \\sim F\\). R: Implement a program that takes Uniform(0,1) random variables and generates random variables from an exponential(\\(\\beta\\)) distribution. Compare your implemented function with the function rexp in R. Solution. \\[\\begin{align} F_Y(y) &= P(Y < y) \\\\ &= P(F(X) < y) \\\\ &= P(X < F_X^{-1}(y)) \\\\ &= F_X(F_X^{-1}(y)) \\\\ &= y. \\end{align}\\] From the above it follows that \\(p(y) = 1\\), so \\(Y\\) is standard uniform. Note that we need to know the inverse CDF to be able to apply this procedure. \\[\\begin{align} P(X < x) &= P(F^{-1}(U) < x) \\\\ &= P(U < F(x)) \\\\ &= F_U(F(x)) \\\\ &= F(x). \\end{align}\\] set.seed(1) nsamps <- 10000 beta <- 4 generate_exp <- function (n, beta) { tmp <- runif(n) X <- qexp(tmp, beta) return (X) } df <- tibble("R" = rexp(nsamps, beta), "myGenerator" = generate_exp(nsamps, beta)) %>% gather() ggplot(data = df, aes(x = value, fill = key)) + geom_histogram(position = "dodge")
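The solution above relies on R's qexp for the inverse CDF. As an illustrative sketch of doing the inversion by hand, using the quantile function \\(F^{-1}(u) = -\\ln(1 - u)/\\beta\\) derived in Exercise 4.8 (the helper name my_rexp below is ours, not from the original text):
# Illustrative sketch: inverse-CDF sampling from Exp(beta) without qexp
my_rexp <- function(n, beta) {
  u <- runif(n)          # U ~ Uniform(0, 1)
  -log(1 - u) / beta     # F^{-1}(u) = -ln(1 - u) / beta
}
set.seed(2)
summary(my_rexp(10000, 4))   # compare with summary(rexp(10000, 4))
mean(my_rexp(10000, 4))      # should be close to 1 / 4 = 0.25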
Chapter 14 Bootstrap This chapter deals with the bootstrap. The students are expected to acquire the following knowledge: How to use the bootstrap to generate coverage intervals. Exercise 14.1 Ideally, a \\(1-\\alpha\\) CI would have \\(1-\\alpha\\) coverage. That is, say a 95% CI should, in the long run, contain the true value of the parameter 95% of the time. In practice, it is impossible to assess the coverage of our CI method, because we rarely know the true parameter. In simulation, however, we can. Let’s assess the coverage of bootstrap percentile intervals. Pick a univariate distribution with a readily available mean and one that you can easily sample from. Draw \\(n = 30\\) random samples from the chosen distribution and use the bootstrap (with large enough m) and the percentile CI method to construct a 95% CI. Repeat the process many times and count how many times the CI contains the true mean. That is, compute the actual coverage probability (don’t forget to include the standard error of the coverage probability!). What can you observe? Try one or two different distributions. What can you observe? Repeat (b) and (c) using BCa intervals (R package boot). How does the coverage compare to percentile intervals? As (d) but using intervals based on asymptotic normality (+/- 1.96 SE). How do results from (b), (d), and (e) change if we increase the sample size to n = 200? What about n = 5? library(boot) set.seed(0) nit <- 1000 # Repeat the process "many times" alpha <- 0.05 # CI parameter nboot <- 100 # m parameter for bootstrap ("large enough m") # f: change this to 200 or 5. nsample <- 30 # n = 30 random samples from the chosen distribution. Comment out BCa code if it breaks.
covers <- matrix(nrow = nit, ncol = 3) covers_BCa <- matrix(nrow = nit, ncol = 3) covers_asymp_norm <- matrix(nrow = nit, ncol = 3) isin <- function (x, lower, upper) { (x > lower) & (x < upper) } for (j in 1:nit) { # Repeating many times # a: pick a univariate distribution - standard normal x1 <- rnorm(nsample) # c: one or two different distributions - beta and poisson x2 <- rbeta(nsample, 1, 2) x3 <- rpois(nsample, 5) X1 <- matrix(data = NA, nrow = nsample, ncol = nboot) X2 <- matrix(data = NA, nrow = nsample, ncol = nboot) X3 <- matrix(data = NA, nrow = nsample, ncol = nboot) for (i in 1:nboot) { X1[ ,i] <- sample(x1, nsample, replace = T) X2[ ,i] <- sample(x2, nsample, T) X3[ ,i] <- sample(x3, nsample, T) } X1_func <- apply(X1, 2, mean) X2_func <- apply(X2, 2, mean) X3_func <- apply(X3, 2, mean) X1_quant <- quantile(X1_func, probs = c(alpha / 2, 1 - alpha / 2)) X2_quant <- quantile(X2_func, probs = c(alpha / 2, 1 - alpha / 2)) X3_quant <- quantile(X3_func, probs = c(alpha / 2, 1 - alpha / 2)) covers[j,1] <- (0 > X1_quant[1]) & (0 < X1_quant[2]) covers[j,2] <- ((1 / 3) > X2_quant[1]) & ((1 / 3) < X2_quant[2]) covers[j,3] <- (5 > X3_quant[1]) & (5 < X3_quant[2]) mf <- function (x, i) return(mean(x[i])) bootX1 <- boot(x1, statistic = mf, R = nboot) bootX2 <- boot(x2, statistic = mf, R = nboot) bootX3 <- boot(x3, statistic = mf, R = nboot) X1_quant_BCa <- boot.ci(bootX1, type = "bca")$bca X2_quant_BCa <- boot.ci(bootX2, type = "bca")$bca X3_quant_BCa <- boot.ci(bootX3, type = "bca")$bca covers_BCa[j,1] <- (0 > X1_quant_BCa[4]) & (0 < X1_quant_BCa[5]) covers_BCa[j,2] <- ((1 / 3) > X2_quant_BCa[4]) & ((1 / 3) < X2_quant_BCa[5]) covers_BCa[j,3] <- (5 > X3_quant_BCa[4]) & (5 < X3_quant_BCa[5]) # e: estimate mean and standard error # sample mean: x1_bar <- mean(x1) x2_bar <- mean(x2) x3_bar <- mean(x3) # standard error (of the sample mean) estimate: sample standard deviation / sqrt(n) x1_bar_SE <- sd(x1) / sqrt(nsample) x2_bar_SE <- sd(x2) / sqrt(nsample) x3_bar_SE <- sd(x3) / sqrt(nsample) covers_asymp_norm[j,1] <- isin(0, x1_bar - 1.96 * x1_bar_SE, x1_bar + 1.96 * x1_bar_SE) covers_asymp_norm[j,2] <- isin(1/3, x2_bar - 1.96 * x2_bar_SE, x2_bar + 1.96 * x2_bar_SE) covers_asymp_norm[j,3] <- isin(5, x3_bar - 1.96 * x3_bar_SE, x3_bar + 1.96 * x3_bar_SE) } apply(covers, 2, mean) ## [1] 0.918 0.925 0.905 apply(covers, 2, sd) / sqrt(nit) ## [1] 0.008680516 0.008333333 0.009276910 apply(covers_BCa, 2, mean) ## [1] 0.927 0.944 0.927 apply(covers_BCa, 2, sd) / sqrt(nit) ## [1] 0.008230355 0.007274401 0.008230355 apply(covers_asymp_norm, 2, mean) ## [1] 0.939 0.937 0.930 apply(covers_asymp_norm, 2, sd) / sqrt(nit) ## [1] 0.007572076 0.007687008 0.008072494 Exercise 14.2 You are given a sample of independent observations from a process of interest: Index 1 2 3 4 5 6 7 8 X 7 2 4 6 4 5 9 10 Compute the plug-in estimate of mean and 95% symmetric CI based on asymptotic normality. Use the plug-in estimate of SE. Same as (a), but use the unbiased estimate of SE. Apply nonparametric bootstrap with 1000 bootstrap replications and estimate the 95% CI for the mean with percentile-based CI. 
# a x <- c(7, 2, 4, 6, 4, 5, 9, 10) n <- length(x) mu <- mean(x) SE <- sqrt(mean((x - mu)^2)) / sqrt(n) SE ## [1] 0.8915839 z <- qnorm(1 - 0.05 / 2) c(mu - z * SE, mu + z * SE) ## [1] 4.127528 7.622472 # b SE <- sd(x) / sqrt(n) SE ## [1] 0.9531433 c(mu - z * SE, mu + z * SE) ## [1] 4.006873 7.743127 # c set.seed(0) m <- 1000 T_mean <- function(x) {mean(x)} est_boot <- array(NA, m) for (i in 1:m) { x_boot <- x[sample(1:n, n, rep = T)] est_boot[i] <- T_mean(x_boot) } quantile(est_boot, p = c(0.025, 0.975)) ## 2.5% 97.5% ## 4.250 7.625 Exercise 14.3 We are given a sample of 10 independent paired (bivariate) observations: Index 1 2 3 4 5 6 7 8 9 10 X 1.26 -0.33 1.33 1.27 0.41 -1.54 -0.93 -0.29 -0.01 2.40 Y 2.64 0.33 0.48 0.06 -0.88 -2.14 -2.21 0.95 0.83 1.45 Compute Pearson correlation between X and Y. Use the cor.test() from R to estimate a 95% CI for the estimate from (a). Apply nonparametric bootstrap with 1000 bootstrap replications and estimate the 95% CI for the Pearson correlation with percentile-based CI. Compare CI from (b) and (c). Are they similar? How would the bootstrap estimation of CI change if we were interested in Spearman or Kendall correlation instead? x <- c(1.26, -0.33, 1.33, 1.27, 0.41, -1.54, -0.93, -0.29, -0.01, 2.40) y <- c(2.64, 0.33, 0.48, 0.06, -0.88, -2.14, -2.21, 0.95, 0.83, 1.45) # a cor(x, y) ## [1] 0.6991247 # b res <- cor.test(x, y) res$conf.int[1:2] ## [1] 0.1241458 0.9226238 # c set.seed(0) m <- 1000 n <- length(x) T_cor <- function(x, y) {cor(x, y)} est_boot <- array(NA, m) for (i in 1:m) { idx <- sample(1:n, n, rep = T) # !!! important to use same indices to keep dependency between x and y est_boot[i] <- T_cor(x[idx], y[idx]) } quantile(est_boot, p = c(0.025, 0.975)) ## 2.5% 97.5% ## 0.2565537 0.9057664 # d # Yes, but the bootstrap CI is more narrow. # e # We just use the functions for Kendall/Spearman coefficients instead: T_kendall <- function(x, y) {cor(x, y, method = "kendall")} T_spearman <- function(x, y) {cor(x, y, method = "spearman")} # Put this in a function that returns the CI bootstrap_95_ci <- function(x, y, t, m = 1000) { n <- length(x) est_boot <- array(NA, m) for (i in 1:m) { idx <- sample(1:n, n, rep = T) # !!! important to use same indices to keep dependency between x and y est_boot[i] <- t(x[idx], y[idx]) } quantile(est_boot, p = c(0.025, 0.975)) } bootstrap_95_ci(x, y, T_kendall) ## 2.5% 97.5% ## -0.08108108 0.78378378 bootstrap_95_ci(x, y, T_spearman) ## 2.5% 97.5% ## -0.1701115 0.8867925 Exercise 14.4 In this problem we will illustrate the use of the nonparametric bootstrap for estimating CIs of regression model coefficients. Load the longley dataset from base R with data(longley). Use lm() to apply linear regression using “Employed” as the target (dependent) variable and all other variables as the predictors (independent). Using lm() results, print the estimated regression coefficients and standard errors. Estimate 95% CI for the coefficients using +/- 1.96 * SE. Use nonparametric bootstrap with 100 replications to estimate the SE of the coefficients from (b). Compare the SE from (c) with those from (b). # a data(longley) # b res <- lm(Employed ~ . 
, longley) tmp <- data.frame(summary(res)$coefficients[,1:2]) tmp$LB <- tmp[,1] - 1.96 * tmp[,2] tmp$UB <- tmp[,1] + 1.96 * tmp[,2] tmp ## Estimate Std..Error LB UB ## (Intercept) -3.482259e+03 8.904204e+02 -5.227483e+03 -1.737035e+03 ## GNP.deflator 1.506187e-02 8.491493e-02 -1.513714e-01 1.814951e-01 ## GNP -3.581918e-02 3.349101e-02 -1.014616e-01 2.982320e-02 ## Unemployed -2.020230e-02 4.883997e-03 -2.977493e-02 -1.062966e-02 ## Armed.Forces -1.033227e-02 2.142742e-03 -1.453204e-02 -6.132495e-03 ## Population -5.110411e-02 2.260732e-01 -4.942076e-01 3.919994e-01 ## Year 1.829151e+00 4.554785e-01 9.364136e-01 2.721889e+00 # c set.seed(0) m <- 100 n <- nrow(longley) T_coef <- function(x) { lm(Employed ~ . , x)$coefficients } est_boot <- array(NA, c(m, ncol(longley))) for (i in 1:m) { idx <- sample(1:n, n, rep = T) est_boot[i,] <- T_coef(longley[idx,]) } SE <- apply(est_boot, 2, sd) SE ## [1] 1.826011e+03 1.605981e-01 5.693746e-02 8.204892e-03 3.802225e-03 ## [6] 3.907527e-01 9.414436e-01 # Show the standard errors around coefficients library(ggplot2) library(reshape2) df <- data.frame(index = 1:7, bootstrap_SE = SE, lm_SE = tmp$Std..Error) melted_df <- melt(df[2:nrow(df), ], id.vars = "index") # Ignore bias which has a really large magnitude ggplot(melted_df, aes(x = index, y = value, fill = variable)) + geom_bar(stat="identity", position="dodge") + xlab("Coefficient") + ylab("Standard error") # + scale_y_continuous(trans = "log") # If you want to also plot bias Exercise 14.5 This exercise shows a shortcoming of the bootstrap method when using the plug in estimator for the maximum. Compute the 95% bootstrap CI for the maximum of a standard normal distribution. Compute the 95% bootstrap CI for the maximum of a binomial distribution with n = 15 and p = 0.2. Repeat (b) using p = 0.9. Why is the result different? # bootstrap CI for maximum alpha <- 0.05 T_max <- function(x) {max(x)} # Equal to T_max = max bootstrap <- function(x, t, m = 1000) { n <- length(x) values <- rep(0, m) for (i in 1:m) { values[i] <- t(sample(x, n, replace = T)) } quantile(values, probs = c(alpha / 2, 1 - alpha / 2)) } # a # Meaningless, as the normal distribution can yield arbitrarily large values. x <- rnorm(100) bootstrap(x, T_max) ## 2.5% 97.5% ## 1.819425 2.961743 # b x <- rbinom(100, size = 15, prob = 0.2) # min = 0, max = 15 bootstrap(x, T_max) ## 2.5% 97.5% ## 6 7 # c x <- rbinom(100, size = 15, prob = 0.9) # min = 0, max = 15 bootstrap(x, T_max) ## 2.5% 97.5% ## 15 15 # Observation: to estimate the maximum, we need sufficient probability mass near the maximum value the distribution can yield. # Using bootstrap is pointless when there is too little mass near the true maximum. # In general, bootstrap will fail when estimating the CI for the maximum. Exercise 14.6 (Practical - and fictional - coverage interval comparison) In this exercise, we investigate how different kinds of CI’s behave as we vary the number of measurements. The story behind the data: it’s 2025 and we’ve discovered that Slovenia has rich deposits of a rare mineral called Moustachium, which can be used to accelerate moustache growth. This mineral is highly sought, so the government has decided to contract two different companies to provide information on where to begin mining. Both companies investigated mining sites in each statistical region and gave their best estimate of the average Moustachium concentration in tonnes per square kilometer. 
The Data Science team has been called to estimate the uncertainty in these estimates and help avoid mining in the wrong region. Generate synthetic data with the script below: set.seed(0) library(comprehenr) regions <- c("pomurska", "podravska", "koroska", "savinjska", "zasavska", "posavska", "JV Slovenija", "primorsko-notranjska", "osrednjeslovenska", "gorenjska", "goriska", "obalno-kraska") region_rates <- seq(1.3, 2.3, length.out=length(regions)) region_rates <- region_rates[sample.int(length(regions), length(regions))] make_dataset <- function(n_contractors) { measurements <- matrix(nrow=length(regions), ncol=n_contractors) for (i in 1:length(regions)) { measurements[i,] <- rgamma(n_contractors, 5.0, region_rates[i]) } df <- data.frame(measurements) row.names(df) <- regions names(df) <- to_vec(for(i in 1:n_contractors) paste("Contractor", i)) return(df) } set.seed(0) df_2025 <- make_dataset(2) set.seed(0) df_2027 <- make_dataset(10) set.seed(0) df_2028 <- make_dataset(100) set.seed(0) df_2029 <- make_dataset(1000) saveRDS(df_2025, file="moustachium_2025.Rda") saveRDS(df_2027, file="moustachium_2027.Rda") saveRDS(df_2028, file="moustachium_2028.Rda") saveRDS(df_2029, file="moustachium_2029.Rda") Estimate the average concentration for different regions. Estimate the average concentration uncertainty using 95% CI’s (asymptotic normality with biased and unbiased standard error, standard bootstrap CI, bootstrap percentile CI). Visualize uncertainties with a histogram and discuss the best location to start mining. The year is 2027 and the government has decided to contract 10 companies. Rerun the code with new measurements and discuss how CI’s change. Technological advancements in robotics have enabled site surveys on a massive scale. Repeat the last point for 100 surveyor robots in 2028 and 1000 surveyor robots in 2029. library(ggplot2) library(dplyr) library(data.table) set.seed(0) input_dataset_path = "moustachium_2025.Rda" # Change this for points d and e output_plot_path = "moustachium_2025.pdf" # Change this for points d and e df <- readRDS(input_dataset_path) # Data comes from here n_contractors <- ncol(df) results_df <- data.frame(region=row.names(df)) # Store CI bounds here # 1. 
average concentration for different mining sites results_df$average_concetration <- rowMeans(df) # CI for the mean based on asymptotic normality (biased SE estimate) biased_SE <- sqrt(apply(df, 1, function(vec) {sum((vec - mean(vec))^2) / length(vec)}) / n_contractors) results_df$ci95.an.biased_var.low <- results_df$average_concetration - 1.96 * biased_SE results_df$ci95.an.biased_var.high <- results_df$average_concetration + 1.96 * biased_SE # CI for the mean based on asymptotic normality (unbiased SE estimate) unbiased_SE <- sqrt(apply(df, 1, var) / n_contractors) results_df$ci95.an.unbiased_var.low <- results_df$average_concetration - 1.96 * unbiased_SE results_df$ci95.an.unbiased_var.high <- results_df$average_concetration + 1.96 * unbiased_SE # Standard bootstrap CI with 1000 samples bootstrap_variance <- function(data, n_samples) { # n_samples is m in pseudocode output <- numeric(n_samples) for (i in 1:n_samples) { index <- sample(1:length(data), length(data), rep = TRUE) resampled_data <- data[index] output[i] <- mean(resampled_data) } return(var(output)) } bootstrap_1000_sd <- sqrt(apply(df, 1, function(vec){bootstrap_variance(vec, 1000)})) results_df$ci95.bootstrap.standard.1000.low <- results_df$average_concetration - 1.96 * bootstrap_1000_sd results_df$ci95.bootstrap.standard.1000.high <- results_df$average_concetration + 1.96 * bootstrap_1000_sd # Bootstrap percentile CI with 1000 samples bootstrap_quantile <- function(data, functional, n_samples, probs) { # n_samples is m in pseudocode output <- numeric(n_samples) for (i in 1:n_samples) { index <- sample(1:length(data), length(data), rep = TRUE) resampled_data <- data[index] output[i] <- functional(resampled_data) } return(quantile(output, probs=probs)) } results_df$ci95.bootstrap.percentile.1000.low <- apply(df, 1, function(vec){bootstrap_quantile(vec, mean, 1000, 0.025)}) results_df$ci95.bootstrap.percentile.1000.high <- apply(df, 1, function(vec){bootstrap_quantile(vec, mean, 1000, 0.975)}) results_df ## region average_concetration ci95.an.biased_var.low ## 1 pomurska 2.814731 1.5351811 ## 2 podravska 2.646518 1.5358919 ## 3 koroska 2.010216 0.5956186 ## 4 savinjska 4.618001 4.4057369 ## 5 zasavska 2.458873 2.0050840 ## 6 posavska 2.153802 1.9001244 ## 7 JV Slovenija 2.433503 1.6860397 ## 8 primorsko-notranjska 3.165394 2.9640430 ## 9 osrednjeslovenska 3.696875 3.5592419 ## 10 gorenjska 1.341931 0.2784547 ## 11 goriska 2.767328 2.3255569 ## 12 obalno-kraska 1.580711 1.4533751 ## ci95.an.biased_var.high ci95.an.unbiased_var.low ci95.an.unbiased_var.high ## 1 4.094281 1.005174095 4.624288 ## 2 3.757144 1.075855548 4.217180 ## 3 3.424813 0.009673183 4.010759 ## 4 4.830264 4.317814385 4.918187 ## 5 2.912662 1.817118318 3.100628 ## 6 2.407479 1.795047746 2.512556 ## 7 3.180965 1.376430415 3.490575 ## 8 3.366746 2.880640556 3.450148 ## 9 3.834508 3.502232367 3.891518 ## 10 2.405407 -0.162051549 2.845913 ## 11 3.209099 2.142569481 3.392086 ## 12 1.708047 1.400630772 1.760792 ## ci95.bootstrap.standard.1000.low ci95.bootstrap.standard.1000.high ## 1 1.5397542 4.089708 ## 2 1.5388631 3.754173 ## 3 0.5492603 3.471171 ## 4 4.4062860 4.829715 ## 5 1.9938049 2.923942 ## 6 1.9010514 2.406552 ## 7 1.6932573 3.173748 ## 8 2.9670216 3.363767 ## 9 3.5602064 3.833544 ## 10 0.2845999 2.399262 ## 11 2.3293359 3.205320 ## 12 1.4543352 1.707087 ## ci95.bootstrap.percentile.1000.low ci95.bootstrap.percentile.1000.high ## 1 1.8914878 3.737975 ## 2 1.8451596 3.447876 ## 3 0.9895308 3.030901 ## 4 4.4648444 4.771157 ## 5 2.1314473 2.786299 ## 6 
1.9707640 2.336840 ## 7 1.8941800 2.972825 ## 8 3.0201118 3.310677 ## 9 3.5975676 3.796183 ## 10 0.5745928 2.109269 ## 11 2.4485735 3.086082 ## 12 1.4888334 1.672589 # Visualization: we use a bar chart with uncertainty bands plot_moustachium_per_region <- function(region_names, average, ci_low, ci_high) { df_visualization <- data.frame(region=region_names, average=average, low=ci_low, high=ci_high) ggplot(df_visualization, aes(x=region, y=average)) + geom_bar(stat="identity") } mask <- endsWith(colnames(results_df), "low") mask[c(1, 2)] <- T results_df_low <- results_df[, mask] colnames(results_df_low) <- gsub('.low','', colnames(results_df_low)) mask <- endsWith(colnames(results_df), "high") mask[c(1, 2)] <- T results_df_high <- results_df[, mask] colnames(results_df_high) <- gsub('.high','', colnames(results_df_high)) long_results_df_low <- melt(setDT(results_df_low), id.vars=c("region", "average_concetration")) names(long_results_df_low) <- c("region", "average_concentration", "variable", "low") long_results_df_high <- melt(setDT(results_df_high), id.vars=c("region", "average_concetration")) names(long_results_df_high) <- c("region", "average_concentration", "variable", "high") long_results_df <- merge(long_results_df_low, long_results_df_high, by=c("region", "variable", "average_concentration"), all=T) moustachium_plot <- ggplot(long_results_df, aes(x=region, y=average_concentration)) + geom_bar(stat="identity", position="dodge", alpha=0.2) + geom_errorbar(aes(ymin=low, ymax=high, color=variable), width=0.2, position=position_dodge(0.9)) + scale_x_discrete(guide = guide_axis(angle = 45)) + ylim(-1, 8) # ggsave(plot=moustachium_plot, width=12, height=8, dpi=300, filename=output_plot_path) moustachium_plot # Visualization: we can also use a map. Circle size denotes concentration in region, low transparency denotes high uncertainty. library(maps) map_data_slo <- map_data('world')[map_data('world')$region == "Slovenia",] map_df <- long_results_df[long_results_df$variable == "ci95.an.biased_var", ] # VERY approximate longitudes and latitudes for different regions. map_df$long <- rep(0, nrow(map_df)) map_df$lat <- rep(0, nrow(map_df)) map_df[map_df$region == "gorenjska"]$long <- 14.2 map_df[map_df$region == "gorenjska"]$lat <- 46.3 map_df[map_df$region == "goriska"]$long <- 13.85 map_df[map_df$region == "goriska"]$lat <- 46.0 map_df[map_df$region == "obalno-kraska"]$long <- 13.9 map_df[map_df$region == "obalno-kraska"]$lat <- 45.65 map_df[map_df$region == "osrednjeslovenska"]$long <- 14.5 map_df[map_df$region == "osrednjeslovenska"]$lat <- 46. map_df[map_df$region == "primorsko-notranjska"]$long <- 14.3 map_df[map_df$region == "primorsko-notranjska"]$lat <- 45.7 map_df[map_df$region == "zasavska"]$long <- 15 map_df[map_df$region == "zasavska"]$lat <- 46.1 map_df[map_df$region == "savinjska"]$long <- 15.2 map_df[map_df$region == "savinjska"]$lat <- 46.25 map_df[map_df$region == "posavska"]$long <- 15.4 map_df[map_df$region == "posavska"]$lat <- 46 map_df[map_df$region == "koroska"]$long <- 15.1 map_df[map_df$region == "koroska"]$lat <- 46.5 map_df[map_df$region == "podravska"]$long <- 15.7 map_df[map_df$region == "podravska"]$lat <- 46.45 map_df[map_df$region == "pomurska"]$long <- 16.2 map_df[map_df$region == "pomurska"]$lat <- 46.65 map_df[map_df$region == "JV Slovenija"]$long <- 15. 
map_df[map_df$region == "JV Slovenija"]$lat <- 45.7 map_df$ci_size <- (map_df$high - map_df$low) map_df$ci_y <- map_df$lat - 0.05 map_df$ci_label <- sprintf("(%.2f, %.2f)", map_df$low, map_df$high) map_df$avg_label <- sprintf("%.2f", map_df$average_concentration) country_plot <- ggplot() + # First layer: worldwide map geom_polygon(data = map_data("world"), aes(x=long, y=lat, group = group), color = '#9c9c9c', fill = '#f3f3f3') + # Second layer: Country map geom_polygon( data = map_data_slo, aes(x=long, y=lat, group = group), color='darkgreen', fill='green', alpha=0.2 ) + geom_point(data=map_df, aes(x=long, y=lat, fill=region, size=average_concentration, alpha=ci_size), color="black", pch=21) + geom_text(data=map_df, aes(x=long, y=ci_y, label=ci_label), size=3) + geom_text(data=map_df, aes(x=long, y=lat, label=avg_label), size=3) + scale_size_continuous(range = c(3, 12), trans = "exp") + scale_alpha_continuous(range = c(0.15, 0.75), trans = "reverse") + ggtitle("Estimated average Moustachium concentration with 95% CI") + coord_cartesian(xlim=c(13.2, 16.7), ylim=c(45.4, 47.)) # ggsave(plot=country_plot, width=18, height=12, dpi=300, filename="country.pdf") country_plot
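For the later parts of the exercise, rather than changing input_dataset_path by hand and eyeballing the plots, a small helper can loop over the four generated datasets and report the average width of the 95% bootstrap percentile CI, making the shrinkage of the intervals with a growing number of contractors explicit. This is an illustrative sketch; it assumes the four moustachium_*.Rda files produced by the generation script are in the working directory, and the helper name compare_ci_widths is ours.
# Illustrative sketch: average width of the 95% bootstrap percentile CI per dataset
compare_ci_widths <- function(paths, m = 1000) {
  sapply(paths, function(p) {
    df <- readRDS(p)
    widths <- apply(df, 1, function(vec) {
      boots <- replicate(m, mean(sample(vec, length(vec), replace = TRUE)))
      diff(quantile(boots, probs = c(0.025, 0.975)))
    })
    mean(widths)  # average CI width across the regions
  })
}
set.seed(0)
compare_ci_widths(c("moustachium_2025.Rda", "moustachium_2027.Rda",
                    "moustachium_2028.Rda", "moustachium_2029.Rda"))
# Expectation: the widths shrink roughly like 1 / sqrt(n_contractors).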