# Attach the packages this script relies on. library() is idempotent, so
# these calls are harmless if the packages are already attached elsewhere.
library(readxl)   # read_excel()
library(dplyr)    # select(), group_by(), arrange(), summarise(), %>%
library(ggplot2)  # ggplot(), aes(), geom_point()

# Import the workbook; the path is resolved against the working directory.
data <- read_excel("myData.xlsx")

# Inspect the imported table.
data

# Column subsets: first every column positioned from TEAMID through TEAM,
# then explicit picks that add PASERANK, GAMES and finally WINPERCENT.
select(data, TEAMID:TEAM)
select(data, TEAMID, TEAM, PASERANK, GAMES)
select(data, TEAMID, TEAM, PASERANK, GAMES, WINPERCENT)
# Summarize by group ----
# Group the rows by WINPERCENT, then order them by ascending PAKERANK.
# The result is printed and remains grouped by WINPERCENT.
# NOTE(review): arrange() ignores grouping unless .by_group = TRUE, so the
# group_by() step does not influence the row order here -- confirm whether
# the grouping (or a per-group sort) is actually intended.
arrange(
  group_by(data, WINPERCENT),
  PAKERANK
)
# Observation: PAKERANK decreases as WINPERCENT increases.
# Scatter plot of WINPERCENT (y) against PAKERANK (x), one point per row.
# No group_by() is needed: geom_point() draws every row independently of
# any dplyr grouping, so the grouping step was a no-op for this plot.
data %>%
  ggplot(mapping = aes(x = PAKERANK, y = WINPERCENT)) +
  # Semi-transparent points keep overlapping observations visible.
  # NOTE(review): TEAMID looks like an identifier; mapping it to point size
  # may not carry meaning -- confirm this aesthetic is intended.
  geom_point(aes(size = TEAMID), alpha = 0.3)
# Grouping by multiple variables ----
# Number of rows for each WINPERCENT / PAKERANK / TEAM combination.
# count() performs the group_by() + summarise(n()) + ungroup() sequence in
# one step: it returns an ungrouped table and does not emit summarise()'s
# ".groups" message. `name = "count"` keeps the original output column name.
data %>%
  count(WINPERCENT, PAKERANK, TEAM, name = "count")