library(tidyverse)

── Attaching core tidyverse packages ──────────────────────── tidyverse 2.0.0 ──
✔ dplyr     1.1.3     ✔ readr     2.1.4
✔ forcats   1.0.0     ✔ stringr   1.5.0
✔ ggplot2   3.4.4     ✔ tibble    3.2.1
✔ lubridate 1.9.3     ✔ tidyr     1.3.0
✔ purrr     1.0.2     
── Conflicts ────────────────────────────────────────── tidyverse_conflicts() ──
✖ dplyr::filter() masks stats::filter()
✖ dplyr::lag()    masks stats::lag()
ℹ Use the conflicted package (<http://conflicted.r-lib.org/>) to force all conflicts to become errors

# Example data used throughout: one row per student with their school,
# teacher, sex, and two test scores. Laid out row-wise so each student's
# record reads left to right.
scores <- tribble(
  ~name,    ~school, ~teacher,  ~sex,     ~math_score, ~reading_score,
  "mike",   "south", "johnson", "male",   4,           1,
  "carol",  "south", "johnson", "female", 3,           5,
  "greg",   "south", "johnson", "male",   2,           2,
  "marcia", "south", "johnson", "female", 4,           4,
  "peter",  "north", "smith",   "male",   3,           5,
  "jan",    "north", "smith",   "female", 4,           4,
  "bobby",  "north", "smith",   "male",   5,           1,
  "cindy",  "south", "perry",   "female", 4,           5,
  "alice",  "south", "perry",   "female", 5,           4
)

# Evaluating the object's name at top level auto-prints it.
scores

# Explicit print() call on the same tibble.
print(scores)

# A tibble: 9 × 6
  name   school teacher sex    math_score reading_score
  <chr>  <chr>  <chr>   <chr>       <dbl>         <dbl>
1 mike   south  johnson male            4             1
2 carol  south  johnson female          3             5
3 greg   south  johnson male            2             2
4 marcia south  johnson female          4             4
5 peter  north  smith   male            3             5
6 jan    north  smith   female          4             4
7 bobby  north  smith   male            5             1
8 cindy  south  perry   female          4             5
9 alice  south  perry   female          5             4

# First three rows, selected by position with slice().
scores %>% slice(1:3)

# The same subset, stored under its own name and then printed.
scores_small <- slice(scores, 1:3)
scores_small

# Two more routes to the first three rows: head() and base-R row indexing.
scores %>%
  head(n = 3)

scores[1:3, ]

# Highest math score first.
scores %>% arrange(desc(math_score))

# Alphabetical by student name.
scores %>% arrange(name)

# Alphabetical by sex, so "female" rows come before "male" rows.
scores %>% arrange(sex)

# Sort on several keys: each later column only breaks ties left by the
# columns before it.
scores %>%
  arrange(
    school,
    teacher,
    sex,
    math_score,
    reading_score
  )

# Keep only the student name and the two score columns.
scores %>% select(name, math_score, reading_score)

# Drop a single column; `!` takes the complement of the selection.
scores %>% select(!sex)

# Drop several columns at once by negating a combined selection.
scores %>% select(-c(sex, reading_score))

# Move `sex` to the front; everything() then adds the remaining columns in
# their existing order.
scores %>% select(sex, everything())

# Male students at the south school, with both conditions joined by `&`.
scores %>% filter(sex == "male" & school == "south")

# The same filter with comma-separated conditions, which filter() combines
# with AND.
scores %>% filter(sex == "male", school == "south")

# Students whose math score is above the overall mean math score.
scores %>% filter(math_score > mean(math_score))

# At least 4 in math and at least 3 in reading.
scores %>% filter(math_score >= 4, reading_score >= 3)

# 3 or below in reading, in math, or in both.
scores %>% filter(reading_score <= 3 | math_score <= 3)

# Three ways to keep students with a reading score of 2, 3, or 4. The scores
# in this data are whole numbers, so all three return the same rows.

# 1. Spell out each accepted value.
scores %>%
  filter(reading_score == 2 | reading_score == 3 | reading_score == 4)

# 2. Bound the score from below and above.
scores %>% filter(reading_score >= 2, reading_score <= 4)

# 3. Test membership in the set of accepted values.
scores %>% filter(reading_score %in% 2:4)

# ?substr

# Students whose name begins with "m": extract the first character of `name`
# and compare it.
scores %>% filter(substr(name, start = 1, stop = 1) == "m")

# Keep every student of any teacher whose highest math score in the class
# is 5. max() returns one of the entered whole-number scores unchanged, so an
# exact comparison is safe here.
scores %>%
  group_by(teacher) %>%
  filter(max(math_score) == 5)

# Keep every student of any sex whose mean math score is 4. mean() returns a
# computed double, so compare with near() (tolerance-based) rather than `==`;
# a tiny floating-point difference would otherwise silently drop the group.
scores %>%
  group_by(sex) %>%
  filter(near(mean(math_score), 4))

# Multiply both scores by 10, overwriting the existing columns.
scores %>%
  mutate(
    math_score = math_score * 10,
    reading_score = reading_score * 10
  )

# Per-student average of the two scores.
scores %>%
  mutate(math_reading_avg = (math_score + reading_score) / 2)

# Logical flag: TRUE when the math score is at least 4.
scores %>%
  mutate(high_math_achiever = math_score >= 4)

# Reading score expressed as a deviation from the overall mean reading score.
scores %>%
  mutate(reading_score_centered = reading_score - mean(reading_score))

# Derived score: math squared plus reading, listed from highest to lowest.
# `^` is R's documented power operator; `**` is only a parser alias for it.
scores %>%
  mutate(science_score = math_score^2 + reading_score) %>%
  arrange(desc(science_score))

# In each pipeline below, mean() and n() are evaluated once per group because
# the tibble is grouped before mutate(); the printed result is still grouped.

# Math score relative to the mean for the student's own sex, largest
# deviation first.
scores %>%
  group_by(sex) %>%
  mutate(
    math_score_centered_by_sex = math_score - mean(math_score)
  ) %>%
  arrange(desc(math_score_centered_by_sex))

# Math score relative to the mean of the student's own teacher's class.
scores %>%
  group_by(teacher) %>%
  mutate(
    math_score_centered_by_teacher = math_score - mean(math_score)
  )

# Attach the class size (number of rows per teacher) to every student.
scores %>%
  group_by(teacher) %>%
  mutate(number_of_students_in_class = n())

# Overall mean math score.
scores %>%
  summarize(math_score_mean = mean(math_score))

# Overall mean reading score. The output column is named after the variable
# that is actually averaged.
scores %>%
  summarize(reading_score_mean = mean(reading_score))

# Mean, across all students, of each student's two-score average.
scores %>%
  summarize(both_score_mean = mean((math_score + reading_score) / 2))

# Lowest math score within each school.
scores %>%
  group_by(school) %>%
  summarize(min_math_score = min(math_score))

# Highest math score within each teacher's class.
scores %>%
  group_by(teacher) %>%
  summarize(max_math_score = max(math_score))

# Only the names of teachers whose class maximum in math is 5.
scores %>%
  group_by(teacher) %>%
  summarize(max_math = max(math_score)) %>%
  filter(max_math == 5) %>%
  select(teacher)

# Lowest reading score for each sex.
scores %>%
  group_by(sex) %>%
  summarize(min_reading_score = min(reading_score))

# Mean and median reading score, plus the number of students, for each sex.
scores %>%
  group_by(sex) %>%
  summarize(
    mean_reading_score = mean(reading_score),
    median_reading_score = median(reading_score),
    n = n()
  )

# Name and math score only, with 5 points added in a new column
# (`math_score_ec`, presumably "extra credit"), sorted lowest to highest.
scores %>%
  select(name, math_score) %>%
  mutate(math_score_ec = math_score + 5) %>%
  arrange(math_score_ec)

# Drop the teacher column, add each student's two-score average, and sort by
# that average, lowest first.
scores %>%
  select(!teacher) %>%
  mutate(mean_score = (math_score + reading_score) / 2) %>%
  arrange(mean_score)

# Mean math score by sex, leaving out students taught by "smith".
scores %>%
  filter(teacher != "smith") %>%
  group_by(sex) %>%
  summarize(mean_math_score = mean(math_score))

# Minimum, maximum, and median reading score among female students at the
# south school.
scores %>%
  filter(sex == "female" & school == "south") %>%
  summarize(
    min_reading_score = min(reading_score),
    max_reading_score = max(reading_score),
    median_reading_score = median(reading_score)
  )

# Highest math score per teacher, then restricted to the south school.
# Grouping by two columns without `.groups` leaves the summary grouped by
# `school`, and summarise() prints a message saying so.
scores %>%
  group_by(school, teacher) %>%
  summarize(max_math_score = max(math_score)) %>%
  filter(school == "south")

`summarise()` has grouped output by 'school'. You can override using the
`.groups` argument.

# Alternative: filter to the south school first, so only one grouping
# variable (teacher) is needed for the summary.
scores %>%
  filter(school == "south") %>%
  group_by(teacher) %>%
  summarize(max_math_score = max(math_score))

# Alternative: keep both grouping variables and state explicitly, through
# `.groups`, that the summary should stay grouped by them.
scores %>%
  group_by(school, teacher) %>%
  summarize(max_math_score = max(math_score), .groups = "keep") %>%
  filter(school == "south")

name	school	teacher	sex	math_score	reading_score
<chr>	<chr>	<chr>	<chr>	<dbl>	<dbl>
mike	south	johnson	male	4	1
carol	south	johnson	female	3	5
greg	south	johnson	male	2	2
marcia	south	johnson	female	4	4
peter	north	smith	male	3	5
jan	north	smith	female	4	4
bobby	north	smith	male	5	1
cindy	south	perry	female	4	5
alice	south	perry	female	5	4

A tibble: 1 × 1
math_score_mean
<dbl>
3.777778

A tibble: 1 × 1
math_score_mean
<dbl>
3.444444

A tibble: 1 × 1
both_score_mean
<dbl>
3.611111

R dplyr Exercises

Exercise 1

Exercise 2

Exercise 3

Exercise 4

Part 1: Arrange

Exercise 5

Exercise 6

Exercise 7

Exercise 8

Part 2: Select

Exercise 9

Exercise 10

Exercise 11

Exercise 12

Part 3: Filter

Exercise 13

Exercise 14

Exercise 15

Exercise 16

Exercise 17

Exercise 18

Part 4: Filter with groups

Exercise 19

Exercise 20

Part 5: Mutate

Exercise 21

Exercise 22

Exercise 23

Exercise 24

Exercise 25

Part 6: Mutate with groups

Exercise 26

Exercise 27

Exercise 28

Part 7: Summarize

Exercise 29

Exercise 30

Exercise 31

Part 8: Summarize with groups

Exercise 32

Exercise 33

Exercise 34

Exercise 35

Part 9: Combining verbs

Exercise 36

Exercise 37

Exercise 38

Exercise 39

Exercise 40

Credits