Import Data

flight <- read.csv("flight.csv")

Remove blank row

flightdf <- flight[-c(3),]

Replace missing values

flightdf$X[2] = 'Alaska'
flightdf$X[4] = 'AM WEST'

Rename columns

names(flightdf) <- c('airline', 'status', 'Los.Angeles', 'Phoenix', 'San.Diego', ' San.Francisco', 'Seattle')

Convert from wide to long data

long <- gather(flightdf, state, measurement, Los.Angeles:Seattle, factor_key = T)

Find average delay by state

delay_state <- long %>% filter(status == 'delayed') %>%
  group_by(airline, state) %>%
  summarise(avg_delay = mean(measurement, na.rm = TRUE)) %>%
  arrange(avg_delay)

Plot data

ggplot(delay_state, aes(x=airline, y=avg_delay, fill=state)) +
geom_col(position = "dodge") +
labs(x = "Airline", y = "Average delays")

Conclusion

The graph above reflects that on average AM West has a significant delay in flights at Phoenix and Alaska airline does not. Alaska airline has a significant delay in flights leaving from Seattle and AM west airline does not.