Mastering Data Visualization Using R, Quarto, and the Tidyverse

An Introduction to R

c(31, -50, 9.3, 29, -4.483, 93)
[1]  31.000 -50.000   9.300  29.000  -4.483  93.000
v <- c(31, -50, 9.3, 29, -4.483, 93)
v
[1]  31.000 -50.000   9.300  29.000  -4.483  93.000
class(v)
[1] "numeric"
is.numeric(v)
[1] TRUE
w <- c(4, 3, 1, 2, 6, 5)
v + w
[1]  35.000 -47.000  10.300  31.000   1.517  98.000
w - 2
[1]  2  1 -1  0  4  3
sum(w)
[1] 21
3:10
[1]  3  4  5  6  7  8  9 10
3.5:-5.5
 [1]  3.5  2.5  1.5  0.5 -0.5 -1.5 -2.5 -3.5 -4.5 -5.5
seq(from = 0.5, to = 20.1, by = 0.4)
 [1]  0.5  0.9  1.3  1.7  2.1  2.5  2.9  3.3  3.7  4.1  4.5  4.9  5.3  5.7  6.1
[16]  6.5  6.9  7.3  7.7  8.1  8.5  8.9  9.3  9.7 10.1 10.5 10.9 11.3 11.7 12.1
[31] 12.5 12.9 13.3 13.7 14.1 14.5 14.9 15.3 15.7 16.1 16.5 16.9 17.3 17.7 18.1
[46] 18.5 18.9 19.3 19.7 20.1
compass <- c("North", "East", "South", "West")
class(compass)
[1] "character"
is.character(compass)
[1] TRUE
valid <- c(TRUE, TRUE, FALSE, FALSE, TRUE)
class(valid)
[1] "logical"
class("TRUE")
[1] "character"
is.logical(valid)
[1] TRUE
is.logical("TRUE")
[1] FALSE
all(valid)
[1] FALSE
x <- c(2, 1, 3)
y <- c(2, 4, 3)
x == y
[1]  TRUE FALSE  TRUE
!valid
[1] FALSE FALSE  TRUE  TRUE FALSE
credible <- c(TRUE, FALSE, TRUE, FALSE, FALSE)
valid & credible
[1]  TRUE FALSE FALSE FALSE FALSE
valid | credible
[1]  TRUE  TRUE  TRUE FALSE  TRUE
mix_attempt <- c(1, "a")
class(mix_attempt)
[1] "character"
mix_attempt
[1] "1" "a"
"1" + "1"
Error in "1" + "1": non-numeric argument to binary operator
s <- seq(from = 0.5, to = 20.1, by = 0.4)
s[1]
[1] 0.5
s[3:6]
[1] 1.3 1.7 2.1 2.5
head(s)
[1] 0.5 0.9 1.3 1.7 2.1 2.5
tail(s)
[1] 18.1 18.5 18.9 19.3 19.7 20.1
repetitions <- c(-5, -5, 2, 2, 2)
unique(repetitions)
[1] -5  2
nums <- c(1, 2, 3, NA, 5, 6)
msg <- c("papa", NA, "bravo", "echo", NA)
nums + 2
[1]  3  4  5 NA  7  8
nums == NA
[1] NA NA NA NA NA NA
is.na(nums)
[1] FALSE FALSE FALSE  TRUE FALSE FALSE
mean(nums)
[1] NA
mean(nums, na.rm = TRUE)
[1] 3.4
?seq
??variance
??"standard deviation"
print(.packages())
[1] "stats"     "graphics"  "grDevices" "utils"     "datasets"  "methods"  
[7] "base"     
print(.packages(all.available = TRUE))
find.package("dplyr")
remove.packages("dplyr")
install.packages("dplyr")
help(package = "dplyr")
starwars
Error: object 'starwars' not found
dplyr::starwars
# A tibble: 87 × 14
   name     height  mass hair_color skin_color eye_color birth_year sex   gender
   <chr>     <int> <dbl> <chr>      <chr>      <chr>          <dbl> <chr> <chr> 
 1 Luke Sk…    172    77 blond      fair       blue            19   male  mascu…
 2 C-3PO       167    75 <NA>       gold       yellow         112   none  mascu…
 3 R2-D2        96    32 <NA>       white, bl… red             33   none  mascu…
 4 Darth V…    202   136 none       white      yellow          41.9 male  mascu…
 5 Leia Or…    150    49 brown      light      brown           19   fema… femin…
 6 Owen La…    178   120 brown, gr… light      blue            52   male  mascu…
 7 Beru Wh…    165    75 brown      light      blue            47   fema… femin…
 8 R5-D4        97    32 <NA>       white, red red             NA   none  mascu…
 9 Biggs D…    183    84 black      light      brown           24   male  mascu…
10 Obi-Wan…    182    77 auburn, w… fair       blue-gray       57   male  mascu…
# ℹ 77 more rows
# ℹ 5 more variables: homeworld <chr>, species <chr>, films <list>,
#   vehicles <list>, starships <list>
library(dplyr)

Attaching package: 'dplyr'
The following objects are masked from 'package:stats':

    filter, lag
The following objects are masked from 'package:base':

    intersect, setdiff, setequal, union
starwars
# A tibble: 87 × 14
   name     height  mass hair_color skin_color eye_color birth_year sex   gender
   <chr>     <int> <dbl> <chr>      <chr>      <chr>          <dbl> <chr> <chr> 
 1 Luke Sk…    172    77 blond      fair       blue            19   male  mascu…
 2 C-3PO       167    75 <NA>       gold       yellow         112   none  mascu…
 3 R2-D2        96    32 <NA>       white, bl… red             33   none  mascu…
 4 Darth V…    202   136 none       white      yellow          41.9 male  mascu…
 5 Leia Or…    150    49 brown      light      brown           19   fema… femin…
 6 Owen La…    178   120 brown, gr… light      blue            52   male  mascu…
 7 Beru Wh…    165    75 brown      light      blue            47   fema… femin…
 8 R5-D4        97    32 <NA>       white, red red             NA   none  mascu…
 9 Biggs D…    183    84 black      light      brown           24   male  mascu…
10 Obi-Wan…    182    77 auburn, w… fair       blue-gray       57   male  mascu…
# ℹ 77 more rows
# ℹ 5 more variables: homeworld <chr>, species <chr>, films <list>,
#   vehicles <list>, starships <list>
head(pull(starwars, var = eye_color))
[1] "blue"   "yellow" "red"    "yellow" "brown"  "blue"  
head(pull(.data = starwars, var = eye_color, name = name))
Luke Skywalker          C-3PO          R2-D2    Darth Vader    Leia Organa 
        "blue"       "yellow"          "red"       "yellow"        "brown" 
     Owen Lars 
        "blue" 
p_1 <- pull(.data = starwars, var = eye_color, name = NULL)
p_2 <- pull(.data = starwars, var = eye_color)
identical(p_1, p_2)
[1] TRUE
pull(var = eye_color, name = NULL)
Error: object 'eye_color' not found
p_3 <- pull(.data = starwars, var = eye_color, name = name)
p_4 <- pull(name = name, .data = starwars, var = eye_color)
identical(p_3, p_4)
[1] TRUE
p_5 <- pull(.data = starwars, var = eye_color, name = name)
p_6 <- pull(starwars, eye_color, name)
identical(p_5, p_6)
[1] TRUE
head(pull(starwars, eye_color, name = name))
Luke Skywalker          C-3PO          R2-D2    Darth Vader    Leia Organa 
        "blue"       "yellow"          "red"       "yellow"        "brown" 
     Owen Lars 
        "blue" 
pull(starwars, var = eye_color, name = name)
tmp_1 <- sample(rivers, 5)
tmp_2 <- sum(tmp_1)
tmp_3 <- pnorm(tmp_2, mean = 2000, sd = 1000)
print(tmp_3, digits = 5)
print(pnorm(sum(sample(rivers, 5)), mean = 2000, sd = 1000), digits = 5)
rivers |>
  sample(5) |>
  sum() |>
  pnorm(mean = 2000, sd = 1000) |>
  print(digits = 5)
# Okay but unnecessarily complicated:
q |>
  pnorm(mean = 2000, sd = 1000)

# Better:
pnorm(q, mean = 2000, sd = 1000)
message("Hello, world!")
# Greet `name` by emitting "Hello, <name>!" through message().
# `name` has no default value in this version, so it must be supplied.
say_hello <- function(name) {
  # The pieces are joined as-is: the space and the "!" come from the literals.
  message("Hello, ", name, "!")
}
say_hello("parallel universe")
Hello, parallel universe!
# Generic skeleton of a function definition: the name being assigned, the
# `function` keyword, a comma-separated argument list in parentheses, and a
# body in braces. `function_name`, `arg1`, and `arg2` are placeholders.
function_name <- function(arg1, arg2, ...) {
  # Body of the function
}
# Greet `name` through message(). `name` defaults to "world", so the function
# can also be called with no arguments at all.
say_hello <- function(name = "world") {
  message("Hello, ", name, "!")
}
say_hello()
Hello, world!
say_hello
function (name = "world") 
{
    message("Hello, ", name, "!")
}
# Return `x` increased by one, handing the result back to the caller with an
# explicit return() call.
increment <- function(x) {
  return(x + 1)
}
y <- increment(5)
y
[1] 6
# Return `x` increased by one. Demonstrates that return() ends the function
# call at once: nothing written after it is executed.
increment <- function(x) {
  return(x + 1)
  # Deliberately unreachable: the function has already returned, so this
  # message is never emitted.
  message("We never get here.")
}
increment(5)
[1] 6
# Return `x` increased by one without calling return(): a function returns the
# value of its last evaluated expression.
increment <- function(x) {
  x + 1
}
country_sizes <- c(15, 7, 15, 69, 69, 82)
min_rank(country_sizes)
[1] 2 1 2 4 4 6
min_rank(desc(country_sizes))
[1] 4 6 4 2 2 1
days <- c("Wednesday", "Saturday", "Thursday", "Sunday", NA)
if_else(
  days %in% c("Saturday", "Sunday"),
  "Weekend",
  "Weekday"
)
[1] "Weekday" "Weekend" "Weekday" "Weekend" "Weekday"
days <- c("Wednesday", "Saturday", "Thursday", "Sunday", NA, "foo")
case_match(
  days,
  "Saturday" ~ "Saturday",
  "Sunday" ~ "Sunday",
  c("Monday", "Tuesday", "Wednesday", "Thursday", "Friday") ~ "Weekday",
  .default = "Unknown"
)
[1] "Weekday"  "Saturday" "Weekday"  "Sunday"   "Unknown"  "Unknown" 
library(tidyverse)
ny_mayor <- tibble(
  borough = c("Bronx", "Brooklyn", "Manhattan", "Queens", "Staten Island"),
  de_blasio = c(117712, 254755, 190312, 171867, 25466),
  malliotakis = c(23715, 74343, 53853, 94911, 70125),
  other = c(3138, 10602, 10186, 8974, 2747)
)
ny_mayor
# A tibble: 5 × 4
  borough       de_blasio malliotakis other
  <chr>             <dbl>       <dbl> <dbl>
1 Bronx            117712       23715  3138
2 Brooklyn         254755       74343 10602
3 Manhattan        190312       53853 10186
4 Queens           171867       94911  8974
5 Staten Island     25466       70125  2747
class(ny_mayor)
[1] "tbl_df"     "tbl"        "data.frame"
is.data.frame(ny_mayor)
[1] TRUE
starwars
# A tibble: 87 × 14
   name     height  mass hair_color skin_color eye_color birth_year sex   gender
   <chr>     <int> <dbl> <chr>      <chr>      <chr>          <dbl> <chr> <chr> 
 1 Luke Sk…    172    77 blond      fair       blue            19   male  mascu…
 2 C-3PO       167    75 <NA>       gold       yellow         112   none  mascu…
 3 R2-D2        96    32 <NA>       white, bl… red             33   none  mascu…
 4 Darth V…    202   136 none       white      yellow          41.9 male  mascu…
 5 Leia Or…    150    49 brown      light      brown           19   fema… femin…
 6 Owen La…    178   120 brown, gr… light      blue            52   male  mascu…
 7 Beru Wh…    165    75 brown      light      blue            47   fema… femin…
 8 R5-D4        97    32 <NA>       white, red red             NA   none  mascu…
 9 Biggs D…    183    84 black      light      brown           24   male  mascu…
10 Obi-Wan…    182    77 auburn, w… fair       blue-gray       57   male  mascu…
# ℹ 77 more rows
# ℹ 5 more variables: homeworld <chr>, species <chr>, films <list>,
#   vehicles <list>, starships <list>
nrow(starwars)
[1] 87
ncol(starwars)
[1] 14
head(starwars)
# A tibble: 6 × 14
  name      height  mass hair_color skin_color eye_color birth_year sex   gender
  <chr>      <int> <dbl> <chr>      <chr>      <chr>          <dbl> <chr> <chr> 
1 Luke Sky…    172    77 blond      fair       blue            19   male  mascu…
2 C-3PO        167    75 <NA>       gold       yellow         112   none  mascu…
3 R2-D2         96    32 <NA>       white, bl… red             33   none  mascu…
4 Darth Va…    202   136 none       white      yellow          41.9 male  mascu…
5 Leia Org…    150    49 brown      light      brown           19   fema… femin…
6 Owen Lars    178   120 brown, gr… light      blue            52   male  mascu…
# ℹ 5 more variables: homeworld <chr>, species <chr>, films <list>,
#   vehicles <list>, starships <list>
glimpse(starwars)
Rows: 87
Columns: 14
$ name       <chr> "Luke Skywalker", "C-3PO", "R2-D2", "Darth Vader", "Leia Or…
$ height     <int> 172, 167, 96, 202, 150, 178, 165, 97, 183, 182, 188, 180, 2…
$ mass       <dbl> 77.0, 75.0, 32.0, 136.0, 49.0, 120.0, 75.0, 32.0, 84.0, 77.…
$ hair_color <chr> "blond", NA, NA, "none", "brown", "brown, grey", "brown", N…
$ skin_color <chr> "fair", "gold", "white, blue", "white", "light", "light", "…
$ eye_color  <chr> "blue", "yellow", "red", "yellow", "brown", "blue", "blue",…
$ birth_year <dbl> 19.0, 112.0, 33.0, 41.9, 19.0, 52.0, 47.0, NA, 24.0, 57.0, …
$ sex        <chr> "male", "none", "none", "male", "female", "male", "female",…
$ gender     <chr> "masculine", "masculine", "masculine", "masculine", "femini…
$ homeworld  <chr> "Tatooine", "Tatooine", "Naboo", "Tatooine", "Alderaan", "T…
$ species    <chr> "Human", "Droid", "Droid", "Human", "Human", "Human", "Huma…
$ films      <list> <"A New Hope", "The Empire Strikes Back", "Return of the J…
$ vehicles   <list> <"Snowspeeder", "Imperial Speeder Bike">, <>, <>, <>, "Imp…
$ starships  <list> <"X-wing", "Imperial shuttle">, <>, <>, "TIE Advanced x1",…
View(starwars)
ny_mayor$borough
[1] "Bronx"         "Brooklyn"      "Manhattan"     "Queens"       
[5] "Staten Island"
```{r}
#| label: read-csv
#| message: false

epl <- read_csv("epl_table.csv")
```
```{r}
#| label: read-xlsx

library(readxl) # Move this line to the top of the QMD file
epl <- read_xlsx("epl_table.xlsx")
```
state.name
 [1] "Alabama"        "Alaska"         "Arizona"        "Arkansas"      
 [5] "California"     "Colorado"       "Connecticut"    "Delaware"      
 [9] "Florida"        "Georgia"        "Hawaii"         "Idaho"         
[13] "Illinois"       "Indiana"        "Iowa"           "Kansas"        
[17] "Kentucky"       "Louisiana"      "Maine"          "Maryland"      
[21] "Massachusetts"  "Michigan"       "Minnesota"      "Mississippi"   
[25] "Missouri"       "Montana"        "Nebraska"       "Nevada"        
[29] "New Hampshire"  "New Jersey"     "New Mexico"     "New York"      
[33] "North Carolina" "North Dakota"   "Ohio"           "Oklahoma"      
[37] "Oregon"         "Pennsylvania"   "Rhode Island"   "South Carolina"
[41] "South Dakota"   "Tennessee"      "Texas"          "Utah"          
[45] "Vermont"        "Virginia"       "Washington"     "West Virginia" 
[49] "Wisconsin"      "Wyoming"       
class(state.name)
[1] "character"
state.region
 [1] South         West          West          South         West         
 [6] West          Northeast     South         South         South        
[11] West          West          North Central North Central North Central
[16] North Central South         South         Northeast     South        
[21] Northeast     North Central North Central South         North Central
[26] West          North Central West          Northeast     Northeast    
[31] West          Northeast     South         North Central North Central
[36] South         West          Northeast     Northeast     South        
[41] North Central South         South         West          Northeast    
[46] South         West          South         North Central West         
Levels: Northeast South North Central West
class(state.region)
[1] "factor"
is.factor(state.region)
[1] TRUE
factor(c("Pomposo", "Colossale", "Pomposo", "Regolare"))
[1] Pomposo   Colossale Pomposo   Regolare 
Levels: Colossale Pomposo Regolare
sizes <- factor(
  c("Pomposo", "Colossale", "Pomposo", "Regolare"),
  levels = c("Modesto", "Regolare", "Pomposo", "Colossale")
)
sizes
[1] Pomposo   Colossale Pomposo   Regolare 
Levels: Modesto Regolare Pomposo Colossale
volumes <- c(
  "Colossale",
  "Minusculo",
  "Regolare",
  "Enorme",
  "Modesto",
  "Piccolo",
  "Microscopico"
)
factor(volumes, levels = c("Modesto", "Regolare", "Pomposo", "Colossale"))
[1] Colossale <NA>      Regolare  <NA>      Modesto   <NA>      <NA>     
Levels: Modesto Regolare Pomposo Colossale
levels(sizes)
[1] "Modesto"   "Regolare"  "Pomposo"   "Colossale"
library(forcats)
fct_recode(
  sizes,
  m = "Modesto",
  r = "Regolare",
  p = "Pomposo",
  c = "Colossale"
)
[1] p c p r
Levels: m r p c
proportions <- factor(c("Pomposo", "Big", "r"))

# Here are the current levels
levels(proportions)
[1] "Big"     "Pomposo" "r"      
# Combine "Pomposo" and "Big" into the new category "p"
fct_collapse(proportions, p = c("Pomposo", "Big"))
[1] p p r
Levels: p r
fct_other(volumes, keep = c("Modesto", "Regolare", "Pomposo", "Colossale"))
[1] Colossale Other     Regolare  Other     Modesto   Other     Other    
Levels: Colossale Modesto Regolare Other
glimpse(gss_cat)
Rows: 21,483
Columns: 9
$ year    <int> 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000, 20…
$ marital <fct> Never married, Divorced, Widowed, Never married, Divorced, Mar…
$ age     <int> 26, 48, 67, 39, 25, 25, 36, 44, 44, 47, 53, 52, 52, 51, 52, 40…
$ race    <fct> White, White, White, White, White, White, White, White, White,…
$ rincome <fct> $8000 to 9999, $8000 to 9999, Not applicable, Not applicable, …
$ partyid <fct> "Ind,near rep", "Not str republican", "Independent", "Ind,near…
$ relig   <fct> Protestant, Protestant, Protestant, Orthodox-christian, None, …
$ denom   <fct> "Southern baptist", "Baptist-dk which", "No denomination", "No…
$ tvhours <int> 12, NA, 2, 4, 1, NA, 3, NA, 0, 3, 2, NA, 1, NA, 1, 7, NA, 3, 3…
relig <- pull(gss_cat, relig)
levels(relig)
 [1] "No answer"               "Don't know"             
 [3] "Inter-nondenominational" "Native american"        
 [5] "Christian"               "Orthodox-christian"     
 [7] "Moslem/islam"            "Other eastern"          
 [9] "Hinduism"                "Buddhism"               
[11] "Other"                   "None"                   
[13] "Jewish"                  "Catholic"               
[15] "Protestant"              "Not applicable"         
fct_count(relig)
# A tibble: 16 × 2
   f                           n
   <fct>                   <int>
 1 No answer                  93
 2 Don't know                 15
 3 Inter-nondenominational   109
 4 Native american            23
 5 Christian                 689
 6 Orthodox-christian         95
 7 Moslem/islam              104
 8 Other eastern              32
 9 Hinduism                   71
10 Buddhism                  147
11 Other                     224
12 None                     3523
13 Jewish                    388
14 Catholic                 5124
15 Protestant              10846
16 Not applicable              0
relig_descending <- fct_infreq(relig)
levels(relig_descending)
 [1] "Protestant"              "Catholic"               
 [3] "None"                    "Christian"              
 [5] "Jewish"                  "Other"                  
 [7] "Buddhism"                "Inter-nondenominational"
 [9] "Moslem/islam"            "Orthodox-christian"     
[11] "No answer"               "Hinduism"               
[13] "Other eastern"           "Native american"        
[15] "Don't know"              "Not applicable"         
fct_count(relig_descending)
# A tibble: 16 × 2
   f                           n
   <fct>                   <int>
 1 Protestant              10846
 2 Catholic                 5124
 3 None                     3523
 4 Christian                 689
 5 Jewish                    388
 6 Other                     224
 7 Buddhism                  147
 8 Inter-nondenominational   109
 9 Moslem/islam              104
10 Orthodox-christian         95
11 No answer                  93
12 Hinduism                   71
13 Other eastern              32
14 Native american            23
15 Don't know                 15
16 Not applicable              0
sizes
[1] Pomposo   Colossale Pomposo   Regolare 
Levels: Modesto Regolare Pomposo Colossale
sizes > "Pomposo"
Warning in Ops.factor(sizes, "Pomposo"): '>' not meaningful for factors
[1] NA NA NA NA
sizes_ord <- factor(
  c("Pomposo", "Colossale", "Pomposo", "Regolare"),
  levels = c("Modesto", "Regolare", "Pomposo", "Colossale"),
  ordered = TRUE
)
class(sizes_ord)
[1] "ordered" "factor" 
is.ordered(sizes_ord)
[1] TRUE
sizes_ord > "Pomposo"
[1] FALSE  TRUE FALSE FALSE
band_members
Error: object 'band_members' not found

Operator	Description
`x + y`	Sum of `x` and `y`
`x - y`	`y` subtracted from `x`
`x * y`	`x` multiplied by `y`
`x / y`	`x` divided by `y`
`x^y` or `x**y`	`x` raised to the power `y`
`x %/% y`	Integer division. Example: `7 %/% 3` returns `2`.
`x %% y`	`x` modulo `y` (i.e., remainder after integer division of `x` by `y`). Example: `7 %% 3` returns `1`.

Operator	Description: `TRUE` if and only if …
`x == y`	`x` equals `y`
`x != y`	`x` does not equal `y`
`x < y`	`x` is less than `y`
`x > y`	`x` is greater than `y`
`x <= y`	`x` is less than or equal to `y`
`x >= y`	`x` is greater than or equal to `y`
`x %in% y`	`x` is an element of `y`

Borough	de Blasio	Malliotakis	Other
Bronx	117,712	23,715	3,138
Brooklyn	254,755	74,343	10,602
Manhattan	190,312	53,853	10,186
Queens	171,867	94,911	8,974
Staten Island	25,466	70,125	2,747

Term	Definition
Argument	An input to a function, specified by position or by name. Some arguments may have default values.
Assignment operator (`<-`)	The symbol used to assign a value to a variable (e.g., `x <- 42`).
Conditional element selection	A method to select elements of a vector from a list of alternatives. The `if_else()` and `case_match()` functions in the dplyr package provide this functionality.
Data frame	A rectangular tabular object where rows are observations and columns represent variables. Each column is a vector, which can be retrieved using `dplyr::pull()` or `$`.
Dollar sign operator (`$`)	An operator to access a specific column of a data frame (e.g., `dfr$col_name`).
Double-colon operator (`::`)	An operator to access a specific object from a package without attaching the entire package. Usage: `dplyr::pull()`.
Factor	A data structure for categorical data. Observations are classified into categories that are stored in the `levels` attribute.
Function	An R object that performs a task dependent on input arguments. Functions are invoked by their name followed by parentheses (e.g., `sum(1:10)`).
Help operator (`?`)	Documentation shortcut. It opens R’s built-in help page for a known object. For example, `?seq` retrieves the help page of the `seq()` function.
Logical vector	A vector whose elements can only be `TRUE`, `FALSE`, or `NA`.
Missing value (`NA`)	A special placeholder indicating “Not available”.
Ordered factor	A factor with a defined order among its levels, enabling comparisons like `<` and `>`.
Package	A bundle of R functions, data, and documentation that extends R’s base capabilities. Packages can be loaded with `library()`.
Pipe operator (`|>`)	An operator that passes the output of one expression as the first argument to the next expression.
Tibble	A data-frame subclass with improved console output.
Vector	An R object whose elements all share the same class (e.g., `numeric`, `character`, or `logical`).

4.1 Vectors

4.1.1 Creating Vector-Valued Variables

4.1.2 Classes of Vectors

4.1.2.1 Numeric Vectors

4.1.2.1.1 Arithmetic Operators

4.1.2.1.2 Shortcuts for Creating Vectors Containing Numeric Sequences

4.1.2.2 Character Vectors

4.1.2.3 Logical Vectors

4.1.2.4 All Elements in a Vector Must Belong to the Same Class

4.1.3 Extracting Vector Elements

4.1.4 Section Summary: Vectors

4.2 Missing Values

4.3 Obtaining Help

4.3.1 R’s Built-in Documentation

4.3.2 Finding Help on the World Wide Web

4.3.3 Section Summary: Obtaining Help

4.4 Integrating Packages into Your Workflow

4.4.1 Installing a Package

4.4.2 Loading the Content of a Package

4.4.2.1 Referring to Package Content Using the Double-Colon Operator

4.4.2.2 Loading a Package Using library()

4.4.3 Section Summary: Packages

4.5 Functions

4.5.1 Passing Arguments to Functions

4.5.1.1 Arguments with Default Values

4.5.1.2 Argument Matching by Name

4.5.1.3 Argument Matching by Position

4.5.1.4 Mixed Matching

4.5.1.5 Pipes

4.5.2 Writing Functions

4.5.2.1 Function Syntax

4.5.2.2 Return Value of a Function

4.5.3 Section Summary: Functions

4.6 Ranking Vector Elements

4.7 Conditional Element Selection from a List of Alternatives

4.7.1 Using if_else() for Two-Way Conditional Selection

4.7.2 Using case_match() for Multi-Way Conditional Selection

4.7.3 Section Summary: Conditional Element Selection

4.8 Data Frames

4.8.1 Creating Data Frames From Scratch

4.8.2 Viewing Data Frames

4.8.3 Extracting Column Vectors with $

4.9 Importing Data

4.9.1 Importing CSV Files

4.9.2 Importing Excel Spreadsheets

4.10 Factors

4.10.1 Example: US States and Regions

4.10.2 Categorical Data

4.10.3 Creating Factors

4.10.4 Retrieving and Changing the Levels

4.10.5 Counting and Sorting Levels by Frequency

4.10.6 Ordered Factors

4.10.7 Section Summary: Factors

4.11 Conclusion

4.12 Exercise

4.4.2.2 Loading a Package Using `library()`

4.7.1 Using `if_else()` for Two-Way Conditional Selection

4.7.2 Using `case_match()` for Multi-Way Conditional Selection

4.8.3 Extracting Column Vectors with `$`