Introduction to R

values

 x <- 3                  # `<-` assigns the value on the right to the name on the left
area_hectares <- 1.0    # an assignment on its own doesn't print anything
area_hectares           # typing the name of the object prints the value of `area_hectares`
(area_hectares <- 1.0)  # and so does putting parentheses around the assignment
area_hectares  * 2.47   # the product is printed but not stored anywhere
area_hectares <- 2.5    # assigning again replaces the previous value
area_hectares * 2.47    # same expression, now evaluated with the new value
area_acres <- area_hectares * 2.47  # store the product (2.5 * 2.47) in a new object
area_hectares <- 50     # area_acres was computed above and is not recalculated by this line
# call a function by passing the input value directly:
sqrt(64)

# or provide the input to the function as a variable:
a <- 64
sqrt(a)

# we can also assign the output to a new variable:
b <- sqrt(a)
b
# with only the number supplied, round() returns a whole number (see output)
round(3.14159)
#> [1] 3
# naming the `digits` argument keeps two decimal places
round(3.14159, digits = 2)
#> [1] 3.14
# the same call with the second argument matched by position instead of name
round(3.14159, 2)
#> [1] 3.14
# when every argument is named, they can be written in any order
round(digits = 2, x = 3.14159)
#> [1] 3.14
# `?` followed by a function name opens that function's help page
?barplot
# args() prints the argument list of a function, including default values
args(lm)
#> function (formula, data, subset, weights, na.action, method = "qr", 
#>     model = TRUE, x = FALSE, y = FALSE, qr = TRUE, singular.ok = TRUE, 
#>     contrasts = NULL, offset, ...) 
#> NULL
# `??` followed by a term searches the installed help pages for that term
??kruskal
# iris is an example data frame that comes with R and 
# head() is a function that returns the first part of the data frame
# dput() prints R code that rebuilds the object (the structure(...) call below)
dput(head(iris)) 
#> structure(list(Sepal.Length = c(5.1, 4.9, 4.7, 4.6, 5, 5.4), 
#>     Sepal.Width = c(3.5, 3, 3.2, 3.1, 3.6, 3.9), Petal.Length = c(1.4, 
#>     1.4, 1.3, 1.5, 1.4, 1.7), Petal.Width = c(0.2, 0.2, 0.2, 
#>     0.2, 0.2, 0.4), Species = structure(c(1L, 1L, 1L, 1L, 1L, 
#>     1L), levels = c("setosa", "versicolor", "virginica"), class = "factor")), row.names = c(NA, 
#> 6L), class = "data.frame")
# Save `iris` to an .rds file and read it back.
# One path is used for both calls so the round trip works on any machine;
# tempdir() is R's per-session scratch directory and exists on every platform.
# If the file is instead sent to someone else, they should pass the location
# where they saved it (e.g. "~/Downloads/iris.rds") to readRDS().
iris_path <- file.path(tempdir(), "iris.rds")
saveRDS(iris, file = iris_path)
some_data <- readRDS(file = iris_path)
# sessionInfo() prints the R version, platform, locale, and the attached and
# loaded packages with their versions (sample output below)
sessionInfo()
#> R version 4.5.1 (2025-06-13)
#> Platform: aarch64-apple-darwin20
#> Running under: macOS Sequoia 15.6.1
#> 
#> Matrix products: default
#> BLAS:   /Library/Frameworks/R.framework/Versions/4.5-arm64/Resources/lib/libRblas.0.dylib 
#> LAPACK: /Library/Frameworks/R.framework/Versions/4.5-arm64/Resources/lib/libRlapack.dylib;  LAPACK version 3.12.1
#> 
#> locale:
#> [1] en_US.UTF-8/en_US.UTF-8/en_US.UTF-8/C/en_US.UTF-8/en_US.UTF-8
#> 
#> time zone: America/Los_Angeles
#> tzcode source: internal
#> 
#> attached base packages:
#> [1] stats     graphics  grDevices utils     datasets  methods   base     
#> 
#> other attached packages:
#>  [1] lubridate_1.9.4 forcats_1.0.0   stringr_1.5.1   dplyr_1.1.4    
#>  [5] purrr_1.1.0     readr_2.1.5     tidyr_1.3.1     tibble_3.3.0   
#>  [9] ggplot2_3.5.2   tidyverse_2.0.0
#> 
#> loaded via a namespace (and not attached):
#>  [1] gtable_0.3.6       jsonlite_2.0.0     compiler_4.5.1     tidyselect_1.2.1  
#>  [5] jquerylib_0.1.4    scales_1.4.0       yaml_2.3.10        fastmap_1.2.0     
#>  [9] R6_2.6.1           generics_0.1.4     knitr_1.50         bookdown_0.44     
#> [13] bslib_0.9.0        pillar_1.11.0      RColorBrewer_1.1-3 tzdb_0.5.0        
#> [17] rlang_1.1.6        cachem_1.1.0       stringi_1.8.7      xfun_0.53         
#> [21] sass_0.4.10        timechange_0.3.0   cli_3.6.5          withr_3.0.2       
#> [25] magrittr_2.0.3     digest_0.6.37      grid_4.5.1         rstudioapi_0.17.1 
#> [29] hms_1.1.3          lifecycle_1.0.4    vctrs_0.6.5        evaluate_1.0.4    
#> [33] glue_1.8.0         farver_2.1.2       rmarkdown_2.29     tools_4.5.1       
#> [37] pkgconfig_2.0.3    htmltools_0.5.8.1
# Combine five plot areas into one numeric vector and inspect it.
area_hectares <- c(21, 34, 39, 54, 55)
area_hectares
#> [1] 21 34 39 54 55
length(area_hectares)
#> [1] 5
class(area_hectares)
#> [1] "numeric"
str(area_hectares)
#>  num [1:5] 21 34 39 54 55
# Grow the vector at either end.
area_hectares <- append(area_hectares, 90)             # add to the end of the vector
area_hectares <- append(area_hectares, 30, after = 0)  # add to the beginning of the vector
area_hectares
#> [1] 30 21 34 39 54 55 90
# A vector of quoted strings has class "character".
animals <- c("mouse", "rat", "dog", "octopus")
class(animals)
#> [1] "character"
# A vector of TRUE/FALSE values has class "logical".
has_tail <- c(TRUE, TRUE, TRUE, FALSE)
has_tail
#> [1]  TRUE  TRUE  TRUE FALSE
class(has_tail)
#> [1] "logical"
# Mixing types in a single c() call: every element ends up with one common type.
num_char <- c(1, 2, 3, "a")
num_logical <- c(1, 2, 3, TRUE)
char_logical <- c("a", "b", "c", TRUE)
tricky <- c(1, 2, 3, "4")
# Square brackets select elements by position; animals[2] is the second element.
animals[2]
#> [1] "rat"
# A vector of positions returns those elements in the order requested.
animals[c(3, 2)]
#> [1] "dog" "rat"
# `2:4` is the run of positions 2, 3, 4.
animals[2:4]
#> [1] "rat"     "dog"     "octopus"
# A negative position drops that element instead of selecting it.
animals[-2]
#> [1] "mouse"   "dog"     "octopus"
# Drop positions 1 through 3 at once.
animals[-c(1:3)]
#> [1] "octopus"
# Positions may be repeated, which repeats the element in the result.
more_animals <- animals[c(1, 2, 3, 2, 1, 4)]
more_animals
#> [1] "mouse"   "rat"     "dog"     "rat"     "mouse"   "octopus"
has_tail # this is a logical vector
#> [1]  TRUE  TRUE  TRUE FALSE
animals[has_tail] # we use it here in the [ ] to subset: only the TRUE positions are kept
#> [1] "mouse" "rat"   "dog"
# `|` keeps elements that satisfy either test; nothing equals "frog", so only "rat" is returned.
animals[animals == "frog" | animals == "rat"] 
#> [1] "rat"
animals %in% c("dog", "rat") # this creates the logical vector
#> [1] FALSE  TRUE  TRUE FALSE
animals[animals %in% c("dog", "rat")] # we use it here in the [ ] to subset
#> [1] "rat" "dog"
# The same, but here is how I would typically do it:
animals_to_find <- c("dog", "rat") # create a vector with the values you are looking for
animals[animals %in% animals_to_find] # apply it in the condition here
#> [1] "rat" "dog"
area_hectares > 50    # will return logicals with TRUE for the indices that meet the condition
#> [1] FALSE FALSE FALSE FALSE  TRUE  TRUE  TRUE
# so we can use this to select only the values above 50
area_hectares[area_hectares > 50]
#> [1] 54 55 90
# `&` requires both tests to hold, so the value 90 is excluded here.
area_hectares[area_hectares > 50 & area_hectares < 90]
#> [1] 54 55
# Arithmetic on vectors is applied element by element.
x <- 1:4
x * 2
#> [1] 2 4 6 8
y <- 6:9
x + y
#> [1]  7  9 11 13
# How the sum above is formed, position by position:
#   x:  1  2  3  4
#       +  +  +  +
#   y:  6  7  8  9
#   ---------------
#       7  9 11 13
# Comparisons are element-wise too and return a logical vector.
x > 2
#> [1] FALSE FALSE  TRUE  TRUE
a <- x > 3  # or, for clarity, a <- (x > 3)
a
#> [1] FALSE FALSE FALSE  TRUE
# Functions such as log() are also applied to every element.
x <- 1:4
log(x)
#> [1] 0.0000000 0.6931472 1.0986123 1.3862944
# Vectors of unequal length: the shorter one is reused from its start until it
# covers the longer one. R warns here because 7 is not a multiple of 3.
x <- c(1, 2, 3)
y <- c(1, 2, 3, 4, 5, 6, 7)
x + y
#> Warning in x + y: longer object length is not a multiple of shorter object
#> length
#> [1] 2 4 6 5 7 9 8
# How x is reused to match the length of y:
#   x:  1  2  3  1  2  3  1
#       +  +  +  +  +  +  +
#   y:  1  2  3  4  5  6  7
#   -----------------------
#       2  4  6  5  7  9  8
# NA marks a missing value; two of the seven ages below are missing.
age <- c(2, 4, 4, NA, 6, NA, 3)
# With the default arguments, missing values in the input make the result NA.
mean(age)
#> [1] NA
sum(age)
#> [1] NA
# na.rm = TRUE removes the missing values before the calculation.
mean(age, na.rm = TRUE)
#> [1] 3.8
sum(age, na.rm = TRUE)
#> [1] 19
# Extract elements which are not missing values.
# `!` is the NOT operator: it flips the TRUE/FALSE values returned by is.na().
age[!is.na(age)]
#> [1] 2 4 4 6 3
# na.omit() returns the object with the missing values removed; the attributes
# printed below record which positions (4 and 6) were dropped.
na.omit(age)
#> [1] 2 4 4 6 3
#> attr(,"na.action")
#> [1] 4 6
#> attr(,"class")
#> [1] "omit"
# Count the number of missing values.
# is.na() returns a logical vector and sum() counts TRUE as 1 and FALSE as 0,
# so the total is the number of NAs.
sum(is.na(age))
#> [1] 2
# Extract elements which are complete cases.
complete.cases(age) # this is a logical vector: TRUE where the value is present
#> [1]  TRUE  TRUE  TRUE FALSE  TRUE FALSE  TRUE
age[complete.cases(age)]
#> [1] 2 4 4 6 3
# NOTE(review): `pop` is not used again in the visible code; presumably it is the
# input for an exercise. Confirm.
pop <- c(10,24,NA,18,NA,20)
# Build a numeric matrix with 5 rows and 4 columns holding the values 1 to 20.
y <- matrix(seq_len(20), nrow = 5, ncol = 4)
y[, 4]       # every row of the fourth column
y[3, ]       # every column of the third row
y[2:4, 1:3]  # rows 2 to 4, restricted to columns 1 to 3
# A list with four named components of different kinds: a string, the
# `animals` vector, the matrix `y`, and a single number.
myl <- list(
  id = "ID_1",
  a_vector = animals,
  a_matrix = y,
  age = 5.3
)
myl[[2]]     # second component, selected by position
myl[["id"]]  # component selected by its name
# Build a data frame with four rows; each named argument becomes one column.
# The last Color value is NA (missing).
mydf <- data.frame(
  ID = 1:4,
  Color = c("red", "white", "red", NA),
  Passed = c(TRUE, TRUE, TRUE, FALSE),
  Weight = c(99, 54, 85, 70),
  Height = c(1.78, 1.67, 1.82, 1.59)
)

mydf
# Hand-built data frame describing four animals.
# data.frame() needs every column to supply one value per row, every string to
# be closed with a matching quote, and every value to be separated by a comma.
animal_data <- data.frame(
  animal = c("dog", "cat", "sea cucumber", "sea urchin"),
  # NOTE(review): only three `feel` values were supplied for four animals;
  # "furry" for the cat is assumed. Confirm.
  feel = c("furry", "furry", "squishy", "spiny"),
  weight = c(45, 8, 1.1, 0.8)
)
# to install a package called "tidyverse", for example: (more on this later)
# Install only when the package is missing, so re-running this script does not
# download and reinstall it every time.
if (!requireNamespace("tidyverse", quietly = TRUE)) {
  install.packages("tidyverse", dependencies = TRUE)
}
# Attach the package for this session. library() stops with an error when the
# package cannot be loaded, so a missing dependency is noticed immediately.
library(tidyverse)
# require(tidyverse) would attach it as well, but it returns FALSE instead of
# raising an error when loading fails, so library() is the one used here.

Introduction to R

Chapter 2 Getting Started with R

2.1 Creating objects in R

Challenge

2.2 Functions and their arguments

2.3 Seeking help

2.3.1 Generative AI Help

Challenge

2.3.2 How to ask for help

2.3.3 Where to ask for help?

2.3.4 Resources on getting help

2.4 Vectors and data types

Challenge

2.5 Subsetting vectors

2.5.1 Conditional subsetting

Challenge

2.6 Vectorization

Challenge

2.6.1 Operations on vectors of unequal length

2.7 Missing data

Challenge

2.8 Common R Data Structures

2.8.1 Matrix

2.8.2 List

2.8.3 Data frame

Challenge

2.9 Extending R base functionality

2.9.1 Installing additional packages

2.9.2 Make use of the installed packages

Challenge