- Identify features of data that drive analyses
- Think critically about what the data could tell you
- Start thinking about the distributional forms for data
1 April 2026
Distributions of data
Classic “coin toss”
set.seed(514) ## flip a coin 1000 times x <- rbinom(n = 1000, size = 1, prob = 0.5) ## count tails (0) and heads (1) table(x)
## x ## 0 1 ## 511 489
Number of times birds were resighted
set.seed(514) ## 37 banded birds; number of resightings x <- rpois(n = 37, lambda = 1) ## count up resightings table(x)
## x ## 0 1 2 3 4 5 ## 7 18 5 5 1 1
Surviving offspring
set.seed(514) ## 1357 tagged smolts; probability of survival is 0.05 x <- rbinom(n = 1357, size = 1, prob = 0.05) ## number of mortalities (0) and survivors (1) table(x) # p ~= 0.0593
## x ## 0 1 ## 1281 76
Common “bell-shaped curve”
## normal distribution (mean = 0, sd = 1)
curve(dnorm(x, mean = 0, sd = sqrt(1)), from = -4, to = 4,
main = "", xlab = "", ylab = "Density", bty = "n",
cex.lab = 1.5, cex.axis = 1.2, lwd = 2, col = "#32006e")
## log-normal distribution (mean = 2, sd = 0.7)
curve(dlnorm(x, meanlog = 2, sdlog = 0.7), from = 0, to = 20,
main = "", xlab = "", ylab = "Density", bty = "n",
cex.lab = 1.5, cex.axis = 1.2, lwd = 2, col = "#32006e")
## beta distribution (mean = 2/3)
curve(dbeta(x, shape1 = 6, shape2 = 3), from = 0, to = 1,
main = "", xlab = "", ylab = "Density", bty = "n",
cex.lab = 1.5, cex.axis = 1.2, lwd = 2, col = "#32006e")