Week 8: Code along 7

Pivoting

long to wide form

table4a_long <- table4a %>%
    pivot_longer(cols=c('1999', '2000'), 
                 names_to = "year",
                 values_to = "cases")

Wide to long form

table4a_long %>%
    pivot_wider(names_from = year,
                values_from = cases)

## # A tibble: 3 × 3
##   country     `1999` `2000`
##   <chr>        <dbl>  <dbl>
## 1 Afghanistan    745   2666
## 2 Brazil       37737  80488
## 3 China       212258 213766

Seperating and Uniting

separate a column

table3_sep <- table3 %>%
    separate(col = rate, into = c("cases", "population"))

Unite two columns

table3_sep %>%
    unite(col = "rate", cases:population, sep = "/")

## # A tibble: 6 × 3
##   country      year rate             
##   <chr>       <dbl> <chr>            
## 1 Afghanistan  1999 745/19987071     
## 2 Afghanistan  2000 2666/20595360    
## 3 Brazil       1999 37737/172006362  
## 4 Brazil       2000 80488/174504898  
## 5 China        1999 212258/1272915272
## 6 China        2000 213766/1280428583

Missing Values

stocks <- tibble(
  year   = c(2015, 2015, 2015, 2015, 2016, 2016, 2016),
  qtr    = c(   1,    2,    3,    4,    2,    3,    4),
  return = c(1.88, 0.59, 0.35,   NA, 0.92, 0.17, 2.66)
)

stocks %>%
    pivot_wider(names_from = year, values_from = return)

## # A tibble: 4 × 3
##     qtr `2015` `2016`
##   <dbl>  <dbl>  <dbl>
## 1     1   1.88  NA   
## 2     2   0.59   0.92
## 3     3   0.35   0.17
## 4     4  NA      2.66

bikes  <- tibble(
  bike_model   = c("A", "A", "B", "B", "C"),
  material    = c("steel", "steel", "aluminum", "aluminum", "steel"),
  price = c(100, 200, 300, 400, 500))

bikes %>%
    pivot_wider(names_from = bike_model, values_from = price)

## Warning: Values from `price` are not uniquely identified; output will contain list-cols.
## • Use `values_fn = list` to suppress this warning.
## • Use `values_fn = {summary_fun}` to summarise duplicates.
## • Use the following dplyr code to identify duplicates.
##   {data} |>
##   dplyr::summarise(n = dplyr::n(), .by = c(material, bike_model)) |>
##   dplyr::filter(n > 1L)

## # A tibble: 2 × 4
##   material A         B         C        
##   <chr>    <list>    <list>    <list>   
## 1 steel    <dbl [2]> <NULL>    <dbl [1]>
## 2 aluminum <NULL>    <dbl [2]> <NULL>

bikes %>%
    complete(bike_model, material)

## # A tibble: 8 × 3
##   bike_model material price
##   <chr>      <chr>    <dbl>
## 1 A          aluminum    NA
## 2 A          steel      100
## 3 A          steel      200
## 4 B          aluminum   300
## 5 B          aluminum   400
## 6 B          steel       NA
## 7 C          aluminum    NA
## 8 C          steel      500

treatment <- tribble(
  ~ person,           ~ treatment, ~response,
  "Derrick Whitmore", 1,           7,
  NA,                 2,           10,
  NA,                 3,           9,
  "Katherine Burke",  1,           4
)
treatment %>%
    fill(person, .direction = "up")

## # A tibble: 4 × 3
##   person           treatment response
##   <chr>                <dbl>    <dbl>
## 1 Derrick Whitmore         1        7
## 2 Katherine Burke          2       10
## 3 Katherine Burke          3        9
## 4 Katherine Burke          1        4

Week 8: Code along 7

R for data science: chapter 12

Joe Jesseman

2024-10-22

Tidy data

Pivoting

long to wide form

Wide to long form

Seperating and Uniting

separate a column

Unite two columns

Missing Values