Import data
# Read the Excel workbook (relative path) into `mydata`.
mydata <- read_excel("../00_data/myData.xlsx")
# Print the imported table. A bare `data` here would display base R's
# data() function instead of the object that was just read.
mydata
Apply the following dplyr verbs to your data
Filter rows
# Keep only the rows whose peak_billboard_position equals "1"
mydata %>%
  filter(peak_billboard_position == "1")
Arrange rows
# Order the rows by genre, descending
mydata %>%
  arrange(desc(genre))
Select columns
# Keep only the third column (selected by position, not by name)
mydata %>%
  select(3)
Add columns
# Derive years_between as artist_birth_year_sum minus debut_album_release_year,
# then show only that new column
mydata %>%
  mutate(years_between = artist_birth_year_sum - debut_album_release_year) %>%
  select(years_between)
Summarize by groups
# Average `year` within each album release year.
# The summary gets its own name (avg_year): reusing release_year, the grouping
# column, would collide with the group key.
# NOTE(review): confirm that mydata has a `year` column distinct from
# release_year; if not, pick a different grouping or summary column.
mydata %>%
  # Group by album release year
  group_by(release_year) %>%
  # Calculate the per-group average
  summarise(avg_year = mean(year, na.rm = TRUE)) %>%
  # Sort by the computed average
  arrange(avg_year)